Tensor2Tensor Hparams,dkl_weight,dkl_weight_fn,dkl_weight_start,dkl_weight_diff,regularization,MOSES BLEU:0.0,Sparsity:0.0,MOSES BLEU:0.5,Sparsity:0.5,MOSES BLEU:1.0,Sparsity:1.0,MOSES BLEU:1.5,Sparsity:1.5,MOSES BLEU:2.0,Sparsity:2.0,MOSES BLEU:2.5,Sparsity:2.5,MOSES BLEU:3.0,Sparsity:3.0,MOSES BLEU:3.5,Sparsity:3.5,MOSES BLEU:4.0,Sparsity:4.0,MOSES BLEU:4.5,Sparsity:4.5,MOSES BLEU:5.0,Sparsity:5.0
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,1,dropout+label_smoothing,0.17,0.986346125603,0.44,0.984580338001,1.57,0.982562661171,10.67,0.979774355888,14.6,0.975349605083,15.35,0.96807706356,15.44,0.955967605114,15.45,0.935014009476,15.44,0.898874878883,15.38,0.845711350441,15.34,0.786605417728
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,1,label_smoothing,0.09,0.988330602646,0.33,0.986961901188,5.87,0.985273182392,12.06,0.982702553272,14.45,0.978415071964,15.76,0.971229493618,15.77,0.959120571613,15.82,0.937592446804,16.01,0.899801254272,15.92,0.845586359501,15.91,0.788092434406
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,1,none,0.46,0.98657220602,3.46,0.985141038895,8.94,0.983271241188,13.55,0.980304121971,15.8,0.975234508514,16.25,0.966760158539,16.58,0.952479183674,16.77,0.927970409393,16.6,0.887782692909,16.42,0.832683682442,16.58,0.774847090244
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,1,dropout+label_smoothing,0.3,0.981532037258,0.5,0.979071855545,6.02,0.976066291332,14.9,0.971729874611,15.99,0.964815616608,16.17,0.953694701195,16.06,0.935862779617,16.16,0.906573712826,16.11,0.86001688242,16.2,0.799876272678,16.18,0.741144120693
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,1,label_smoothing,0.22,0.984102427959,2.37,0.981932461262,10.9,0.97909039259,14.71,0.974776446819,16.72,0.967729866505,17.01,0.95644056797,16.98,0.938254654408,17.02,0.908026814461,17.1,0.859698951244,17.07,0.798654317856,17.13,0.740989685059
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,1,none,0.43,0.981700360775,5.15,0.979586660862,12.99,0.976656794548,16.2,0.971890985966,17.37,0.963995099068,17.24,0.951097607613,17.12,0.930234491825,17.23,0.8968719244,17.27,0.846957683563,17.12,0.78643733263,17.24,0.729794919491
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,1,dropout+label_smoothing,0.26,0.969819545746,3.53,0.965808868408,15.29,0.960480034351,18.04,0.952258706093,18.57,0.939303159714,18.71,0.919670462608,18.75,0.890541434288,18.8,0.84766471386,18.75,0.789300978184,18.79,0.727352917194,18.77,0.675083875656
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,1,label_smoothing,4.15,0.974063277245,9.43,0.971220374107,15.31,0.966944217682,17.56,0.959616303444,18.32,0.94733530283,18.71,0.927926659584,18.85,0.898262798786,18.95,0.853741049767,19,0.794174253941,19.04,0.734262347221,18.98,0.685565173626
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,1,none,2.64,0.971424758434,9.27,0.968702316284,15.68,0.96429002285,18.62,0.95638948679,19.57,0.942880570889,19.73,0.921423792839,19.74,0.888849854469,20.04,0.841534554958,19.94,0.779702067375,19.88,0.716514289379,19.95,0.663717806339
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,1,dropout+label_smoothing,0.84,0.901050984859,14.8,0.886287868023,21.83,0.863945186138,22.82,0.830906629562,23.35,0.786256670952,23.42,0.730647087097,23.54,0.665379106998,23.46,0.591528713703,23.47,0.519375503063,23.5,0.45982336998,23.45,0.411622792482
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,1,label_smoothing,1.44,0.916776537895,13.39,0.905971109867,21.39,0.887580394745,23.01,0.858301103115,23.37,0.81697177887,23.53,0.763918817043,23.52,0.699788510799,23.67,0.626482963562,23.61,0.556923270226,23.65,0.50025087595,23.7,0.454339206219
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,1,none,7.38,0.910223305225,19.08,0.898855686188,22.05,0.879303812981,23.02,0.848665714264,23.44,0.805622339249,23.62,0.750821709633,23.63,0.686384797096,23.64,0.614673435688,23.63,0.544630467892,23.57,0.486613631248,23.66,0.440194606781
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,100000,dropout+label_smoothing,0.34,0.978602707386,0.26,0.97527629137,0.22,0.971750199795,0.63,0.967432081699,11.4,0.960884571075,18.27,0.949682056904,18.78,0.930636465549,18.87,0.897658467293,18.95,0.83982360363,18.98,0.760839998722,18.99,0.678691267967
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,100000,label_smoothing,0.17,0.981338858604,0.14,0.978820860386,0.16,0.975905418396,0.69,0.972003400326,12.3,0.965618610382,18.08,0.954342246056,19.2,0.935123205185,19.61,0.900906682014,19.84,0.841275572777,19.89,0.764547586441,19.94,0.688831627369
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,100000,none,0,0.978577256203,0,0.976146221161,0.1,0.973309457302,2.43,0.969321012497,15.94,0.962420165539,18.94,0.95010215044,19.73,0.928952097893,20.07,0.892266094685,20.22,0.83123844862,20.37,0.75322508812,20.4,0.676430344582
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,0,100000,dropout+label_smoothing,0.13,0.981196939945,0.2,0.978444099426,0.48,0.975412070751,2.86,0.971432745457,15.61,0.965027809143,17.83,0.954044520855,18.11,0.935930609703,18.46,0.905616283417,18.55,0.853324234486,18.46,0.778569221497,18.47,0.698907256126
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,0,100000,label_smoothing,0.16,0.983509838581,0.1,0.981242239475,0.37,0.978577971458,1.17,0.974957883358,12.2,0.968953192234,17.78,0.95828127861,18.75,0.940214216709,19.02,0.908816933632,19.34,0.853991091251,19.31,0.780685901642,19.51,0.707741081715
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,0,100000,none,0,0.981253445148,0.09,0.979300677776,0.29,0.976948201656,3.25,0.973442137241,16.31,0.967119038105,18.69,0.955749094486,19.4,0.93629771471,19.69,0.902801096439,19.76,0.846929371357,19.85,0.773501038551,19.96,0.700529456139
sparse_transformer_variational_dropout,2.22222222222e-7,linear,100000,100000,dropout+label_smoothing,0.09,0.966984570026,0.15,0.963142335415,0.25,0.958782911301,0.93,0.953103005886,13.37,0.944307804108,18.58,0.929417312145,19.33,0.903405964375,19.62,0.854355871677,19.68,0.779354214668,19.74,0.688567638397,19.74,0.589260578156
sparse_transformer_variational_dropout,2.22222222222e-7,linear,100000,100000,label_smoothing,0.05,0.967726230621,0.06,0.965271472931,0.08,0.962210774422,0.41,0.957726061344,7.85,0.949978113174,18.19,0.936137139797,19.86,0.910125255585,20.42,0.858656644821,20.56,0.782087922096,20.7,0.690541386604,20.8,0.590266227722
sparse_transformer_variational_dropout,2.22222222222e-7,linear,100000,100000,none,0,0.966085135937,0,0.963342726231,0.06,0.959896743298,0.6,0.954852163792,11.23,0.946222662926,19.46,0.931183934212,20.53,0.904558300972,20.82,0.854869902134,20.89,0.777423501015,21.11,0.682089805603,21.11,0.579207479954
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,100000,100000,dropout+label_smoothing,0.11,0.968895375729,0.18,0.965402245522,0.24,0.96145260334,1.27,0.956212222576,15.42,0.947817802429,18.61,0.933557331562,19.43,0.908547639847,19.59,0.860632836819,19.63,0.785073518753,19.79,0.692577898502,19.85,0.591127455235
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,100000,100000,label_smoothing,0.13,0.97000002861,0,0.967741549015,0.26,0.964904308319,1.72,0.96070766449,12.11,0.953308999538,18.66,0.939930558205,19.86,0.914768278599,20.32,0.864111840725,20.46,0.786220729351,20.43,0.692279458046,20.44,0.589439868927
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,100000,100000,none,0,0.968144237995,0,0.965707302094,0.07,0.962634563446,1.27,0.957964479923,15.07,0.949725210667,19.5,0.935137629509,20.57,0.909030735493,20.75,0.859765172005,20.85,0.78143465519,21.09,0.684354126453,21.13,0.579205513
sparse_transformer_variational_dropout,2.22222222222e-7,linear,200000,100000,dropout+label_smoothing,0.05,0.955271065235,0.12,0.95153260231,0.35,0.946879029274,3.94,0.940264105797,18,0.929801702499,19.37,0.912584245205,19.81,0.880502343178,19.98,0.824151754379,20.12,0.746223032475,20.15,0.650751709938,20.13,0.543239176273
sparse_transformer_variational_dropout,2.22222222222e-7,linear,200000,100000,label_smoothing,0,0.949443519115,0,0.947313249111,0.24,0.944354891777,4.11,0.939673125744,14.71,0.931363999844,19.41,0.916236400604,20.32,0.884660482407,20.81,0.828287780285,20.94,0.750048518181,21.06,0.653227627277,21.2,0.542895674706
sparse_transformer_variational_dropout,2.22222222222e-7,linear,200000,100000,none,0.09,0.948185801506,0.11,0.945783674717,0.19,0.942386090755,1.53,0.936905741692,15.05,0.927440881729,19.9,0.911073684692,20.86,0.88021916151,21.14,0.824357450008,21.36,0.742809593678,21.45,0.640885293484,21.27,0.527206838131
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,200000,100000,dropout+label_smoothing,0.08,0.958377182484,0.17,0.955043435097,0.35,0.950850844383,3.93,0.944793760777,17.43,0.934985280037,19.1,0.918431460857,19.4,0.886726498604,19.59,0.829413175583,19.66,0.748995363712,19.57,0.64999550581,19.67,0.538302183151
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,200000,100000,label_smoothing,0.05,0.952573359013,0.06,0.950717389584,0.14,0.948088645935,1.47,0.943764865398,14.21,0.935929954052,19.26,0.921594798565,20.33,0.890918493271,20.74,0.833832263947,20.95,0.752944052219,20.93,0.651806712151,20.96,0.536612868309
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,200000,100000,none,0.11,0.951451420784,0.13,0.949365198612,0.34,0.946363449097,4.5,0.941380500793,17.69,0.932565391064,20.15,0.916981816292,20.85,0.886940479279,21.1,0.830496549606,21.24,0.74581360817,21.08,0.639020681381,21.16,0.520426690578
sparse_transformer_variational_dropout,2.22222222222e-7,linear,300000,100000,dropout+label_smoothing,0.4,0.939298689365,1.66,0.935349881649,11.07,0.929867684841,18.43,0.921831905842,19.59,0.909748613834,20.08,0.890093684196,20.34,0.852843761444,20.38,0.79464840889,20.48,0.716376125813,20.45,0.620067119598,20.48,0.511726021767
sparse_transformer_variational_dropout,2.22222222222e-7,linear,300000,100000,label_smoothing,0.23,0.922187745571,0.58,0.919961869717,2.6,0.916576564312,13.9,0.911083400249,19.18,0.902002036572,20.62,0.885301828384,21.09,0.850777983665,21.32,0.795332610607,21.36,0.719392538071,21.62,0.62399828434,21.55,0.514829397202
sparse_transformer_variational_dropout,2.22222222222e-7,linear,300000,100000,none,0.16,0.920255303383,0.55,0.917880237103,5.57,0.914146125317,16.71,0.908048510551,19.86,0.898117125034,20.99,0.881034076214,21.45,0.848076105118,21.61,0.79255259037,21.76,0.7129804492,21.91,0.612467944622,21.82,0.499899744987
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,300000,100000,dropout+label_smoothing,0.4,0.943791329861,1.06,0.940420210361,10.07,0.935719549656,18.2,0.928735256195,19.54,0.917959213257,20.07,0.899785816669,20.22,0.863490104675,20.31,0.804519355297,20.27,0.723666012287,20.3,0.622736334801,20.3,0.508869588375
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,300000,100000,label_smoothing,0.11,0.927082479,0.36,0.925119400024,3.2,0.92211407423,14.97,0.917199730873,19.49,0.909020543098,20.76,0.893514931202,21.13,0.859710335732,21.48,0.803402721882,21.69,0.724401533604,21.76,0.623955130577,21.68,0.509292304516
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,300000,100000,none,0.12,0.924917936325,0.32,0.922850131989,3.81,0.919573605061,16.17,0.914220869541,20.34,0.905446112156,21.35,0.889888584614,21.71,0.858082711697,21.84,0.801736533642,22.03,0.718704283237,22.19,0.613036692142,22.11,0.495351880789
sparse_transformer_variational_dropout,2.22222222222e-7,linear,400000,100000,dropout+label_smoothing,19.31,0.89327943325,20.4,0.889396250248,20.78,0.884012699127,21.1,0.876335740089,21.34,0.864965379238,21.52,0.845102250576,21.56,0.808241188526,21.67,0.752477824688,21.63,0.677298426628,21.62,0.584962308407,21.69,0.482312679291
sparse_transformer_variational_dropout,2.22222222222e-7,linear,400000,100000,label_smoothing,16.32,0.849018335342,18.85,0.846618592739,20.54,0.843418955803,21.33,0.838952243328,21.74,0.831969797611,22.14,0.817489981651,22.39,0.787150144577,22.53,0.737705230713,22.53,0.66758710146,22.55,0.578725814819,22.56,0.478009104729
sparse_transformer_variational_dropout,2.22222222222e-7,linear,400000,100000,none,16.58,0.834359705448,19.61,0.831378400326,20.68,0.827619314194,21.42,0.822857618332,21.8,0.81613945961,22.02,0.803902387619,22.1,0.778178453445,22.29,0.732016146183,22.44,0.661469519138,22.43,0.569573998451,22.44,0.466196477413
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,400000,100000,dropout+label_smoothing,18.5,0.907960176468,19.56,0.904865682125,20.12,0.900375723839,20.48,0.893817067146,20.65,0.883818984032,20.88,0.865318477154,20.93,0.829054474831,20.95,0.772965729237,20.93,0.695774316788,21.03,0.598914325237,21.01,0.490111917257
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,400000,100000,label_smoothing,16.01,0.868887484074,18.79,0.867197871208,20.4,0.864645957947,21.08,0.860652148724,21.46,0.854013442993,21.78,0.839616298676,21.91,0.808742880821,21.95,0.75833940506,22.07,0.686295330524,22.02,0.593302726746,22,0.486582964659
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,400000,100000,none,17.68,0.860311746597,19.6,0.858401358128,20.81,0.855718612671,21.4,0.851740479469,21.86,0.845388948917,21.95,0.832806169987,22.05,0.805395245552,22.15,0.755993902683,22.17,0.680681824684,22.05,0.582580149174,22.05,0.472418606281
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,100000,dropout+label_smoothing,0.08,0.970701158047,0.11,0.966216444969,0.3,0.961340606213,2.71,0.955032348633,16.9,0.945102751255,19.42,0.928474843502,19.81,0.901345193386,19.93,0.855883955956,19.95,0.783419728279,19.95,0.697079122066,20,0.614165723324
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,100000,label_smoothing,0.11,0.974288105965,0.14,0.971260547638,0.58,0.967683672905,7.96,0.962465524673,17.83,0.953358113766,19.71,0.937527179718,20.24,0.910930156708,20.59,0.86471581459,20.82,0.792792677879,20.92,0.712579071522,20.88,0.638862550259
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,100000,none,0.08,0.971603393555,0.03,0.968236267567,0.14,0.964189291,2.73,0.958383977413,17.38,0.948337674141,20.48,0.930712342262,20.98,0.901168823242,21.29,0.852573812008,21.33,0.779628515244,21.41,0.696227252483,21.47,0.619377493858
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,0,100000,dropout+label_smoothing,0.15,0.97427457571,0.17,0.970588028431,0.21,0.966494858265,1.69,0.961008369923,16.38,0.952042818069,19.06,0.93677675724,19.36,0.911962151527,19.44,0.870939195156,19.43,0.804814934731,19.5,0.72223174572,19.51,0.642385840416
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,0,100000,label_smoothing,0.05,0.977472960949,0.1,0.974918842316,0.21,0.97183316946,3.32,0.967212021351,16.16,0.958975255489,18.99,0.944506108761,19.9,0.920312285423,20.13,0.879038989544,20.15,0.812941074371,20.34,0.735221147537,20.41,0.663585960865
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,0,100000,none,0.09,0.97505325079,0.24,0.972675383091,0.67,0.969641089439,8.02,0.964738130569,18.49,0.955637812614,19.9,0.939661383629,20.39,0.912939608097,20.55,0.868847548962,20.64,0.801703810692,20.73,0.723415672779,20.73,0.651353240013
sparse_transformer_variational_dropout,1.55555555556e-7,linear,100000,100000,dropout+label_smoothing,0.08,0.957979917526,0.15,0.952737569809,0.36,0.946652650833,4.15,0.938382863998,18.76,0.925399661064,19.98,0.904241681099,20.34,0.868133246899,20.57,0.805065393448,20.66,0.719258069992,20.6,0.622637867928,20.67,0.523155391216
sparse_transformer_variational_dropout,1.55555555556e-7,linear,100000,100000,label_smoothing,0.13,0.960141479969,0,0.956657409668,0.35,0.952244579792,3.39,0.945598900318,17.2,0.934232294559,19.98,0.914594233036,20.86,0.878526031971,21.28,0.814019382,21.5,0.727814674377,21.5,0.631583869457,21.56,0.532023251057
sparse_transformer_variational_dropout,1.55555555556e-7,linear,100000,100000,none,0.05,0.957720637321,0.09,0.953851819038,0.3,0.948903799057,6.74,0.941442668438,18.03,0.928819835186,20.82,0.90762001276,21.33,0.871038258076,21.61,0.807752907276,21.71,0.719645261765,21.8,0.619915366173,21.81,0.518602609634
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,100000,100000,dropout+label_smoothing,0.15,0.960401594639,0.18,0.955543577671,0.29,0.94990080595,2.39,0.942185163498,17.93,0.929843604565,19.84,0.909262478352,20.37,0.873732745647,20.48,0.810844182968,20.64,0.723607003689,20.61,0.625338971615,20.63,0.524298369884
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,100000,100000,label_smoothing,0.09,0.962404668331,0.1,0.959217309952,0.07,0.955114424229,1.57,0.948741316795,17.44,0.937656879425,20.19,0.918489873409,21,0.883049607277,21.43,0.818249642849,21.59,0.730164945126,21.67,0.631566762924,21.61,0.529915213585
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,100000,100000,none,0.05,0.960027575493,0.06,0.956569969654,0.22,0.95204025507,7.08,0.944948256016,18.46,0.932735741138,20.67,0.911988377571,21.13,0.875765144825,21.37,0.812414050102,21.46,0.72315955162,21.69,0.621961176395,21.66,0.519152998924
sparse_transformer_variational_dropout,1.55555555556e-7,linear,200000,100000,dropout+label_smoothing,0.13,0.946134209633,0.19,0.940803050995,0.58,0.933983147144,11.65,0.924127936363,19.69,0.908905088902,20.53,0.884519517422,20.82,0.840899825096,20.97,0.77169418335,21.01,0.683056116104,20.96,0.581817388535,20.93,0.475822746754
sparse_transformer_variational_dropout,1.55555555556e-7,linear,200000,100000,label_smoothing,0,0.941418647766,0.07,0.938159763813,0.25,0.933541834354,4.7,0.926107823849,18.12,0.913419425488,20.73,0.891251564026,21.53,0.848142027855,21.72,0.779132425785,21.82,0.690196692944,21.91,0.58755427599,21.93,0.478835821152
sparse_transformer_variational_dropout,1.55555555556e-7,linear,200000,100000,none,0.41,0.934875786304,2.53,0.928041636944,14.88,0.91873639822,19.66,0.905538976192,20.79,0.885803937912,21.23,0.854398310184,21.54,0.801632702351,21.77,0.721644937992,21.86,0.623358726501,21.86,0.519611179829,21.89,0.420092880726
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,200000,100000,dropout+label_smoothing,0.15,0.949242830276,0.28,0.94433683157,1.33,0.938037753105,15.91,0.928817868233,20.02,0.914236545563,20.56,0.890555500984,20.96,0.847447752953,20.98,0.777252495289,21.02,0.686281323433,21.02,0.582130789757,20.96,0.47297501564
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,200000,100000,label_smoothing,0.09,0.944870889187,0.15,0.941954851151,0.86,0.937724769115,10.67,0.930665135384,19.51,0.918420612812,20.85,0.896740019321,21.35,0.853588104248,21.36,0.782908737659,21.62,0.691216409206,21.68,0.585207760334,21.65,0.473033756018
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,200000,100000,none,0.09,0.942464888096,0.11,0.939234316349,0.73,0.934508144855,11.34,0.92672842741,19.6,0.913619279861,21.17,0.891274452209,21.75,0.849888861179,22.05,0.780004501343,22.04,0.685379505157,22.14,0.575812220573,22.08,0.46234613657
sparse_transformer_variational_dropout,1.55555555556e-7,linear,300000,100000,dropout+label_smoothing,0.58,0.928471028805,4.43,0.922671735287,16.99,0.914550364017,20.09,0.902831614017,20.89,0.885740816593,21.19,0.858414471149,21.26,0.81021797657,21.41,0.740241706371,21.38,0.652165174484,21.39,0.551403582096,21.46,0.446202546358
sparse_transformer_variational_dropout,1.55555555556e-7,linear,300000,100000,label_smoothing,0.13,0.911848068237,0.83,0.908449590206,9.51,0.9031214118,18.61,0.894628107548,20.86,0.881060957909,21.6,0.856983423233,21.92,0.811623811722,22.2,0.744138777256,22.27,0.657518267632,22.23,0.556907117367,22.26,0.450432568789
sparse_transformer_variational_dropout,1.55555555556e-7,linear,300000,100000,none,0.38,0.907833635807,2.3,0.904153943062,11.99,0.898399055004,19.95,0.889312028885,21.52,0.875129163265,22.41,0.851264297962,22.56,0.80775642395,22.59,0.739819526672,22.76,0.649841964245,22.75,0.545706272125,22.85,0.437846958637
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,300000,100000,dropout+label_smoothing,0.99,0.933124899864,6.3,0.928025126457,17.66,0.92075330019,20.18,0.909833788872,20.97,0.893337845802,21.23,0.86634594202,21.16,0.817560076714,21.24,0.745368659496,21.16,0.653582513332,21.23,0.54842042923,21.24,0.439174562693
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,300000,100000,label_smoothing,0.07,0.917198121548,0.57,0.914146065712,8.06,0.909405827522,18.07,0.901773750782,20.72,0.889322519302,21.41,0.866355478764,21.89,0.821186184883,21.92,0.752198517323,22,0.662433981895,22.02,0.557579040527,22.07,0.447093069553
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,300000,100000,none,0.22,0.913765609264,1.9,0.910483241081,13.16,0.905322730541,19.76,0.897100806236,21.51,0.884026706219,22.1,0.861261308193,22.31,0.818022370338,22.66,0.748436331749,22.58,0.655078232288,22.55,0.546500623226,22.58,0.434468626976
sparse_transformer_variational_dropout,1.55555555556e-7,linear,400000,100000,dropout+label_smoothing,20.24,0.87130355835,21.35,0.865467846394,21.79,0.857919216156,22.24,0.847638487816,22.34,0.832644701004,22.55,0.806875050068,22.63,0.761503219604,22.58,0.695658624172,22.56,0.611482918262,22.66,0.515240013599,22.64,0.415883541107
sparse_transformer_variational_dropout,1.55555555556e-7,linear,400000,100000,label_smoothing,18.97,0.821712195873,20.97,0.817571461201,21.71,0.812576174736,22.31,0.80624717474,22.45,0.796816408634,22.82,0.777729153633,23.02,0.739747583866,23.1,0.68008852005,23.18,0.600546002388,23.19,0.5077085495,23.2,0.410938978195
sparse_transformer_variational_dropout,1.55555555556e-7,linear,400000,100000,none,20.04,0.797230362892,21.48,0.791895031929,22.24,0.785795688629,22.73,0.778675615788,22.99,0.769191086292,23.16,0.752330243587,23.27,0.718529343605,23.31,0.661684572697,23.34,0.582087039948,23.44,0.487828224897,23.46,0.390633285046
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,400000,100000,dropout+label_smoothing,19.9,0.892443239689,20.96,0.887956440449,21.14,0.881579637527,21.68,0.872309148312,21.75,0.858227670193,21.93,0.832818210125,22.04,0.786816120148,22.16,0.719251275063,22.16,0.632091701031,22.15,0.531183540821,22.12,0.426560878754
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,400000,100000,label_smoothing,17.82,0.849693059921,19.95,0.847022891045,21.34,0.843285143375,21.92,0.837637603283,22.31,0.828247189522,22.47,0.808355987072,22.52,0.768567740917,22.65,0.706503093243,22.68,0.623137533665,22.67,0.524743974209,22.63,0.42134219408
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,400000,100000,none,17.69,0.836506009102,20.12,0.833305835724,21.36,0.829167664051,21.88,0.823435604572,22.18,0.814439177513,22.45,0.796788573265,22.76,0.760490953922,22.65,0.699550807476,22.74,0.614331901073,22.84,0.513293147087,22.8,0.408723980188
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,100000,dropout+label_smoothing,0.2,0.953252315521,0.27,0.946413218975,1.71,0.938469171524,16.3,0.927281975746,20.42,0.909350574017,21.05,0.880952894688,21.02,0.837233960629,21.28,0.769985973835,21.42,0.680428266525,21.44,0.590159356594,21.46,0.509084880352
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,100000,label_smoothing,0.08,0.959366858006,0.13,0.954687356949,0.46,0.948742568493,12.15,0.939419090748,20.53,0.923260748386,21.82,0.896609783173,22.13,0.854278028011,22.29,0.787901103497,22.35,0.702519595623,22.41,0.619810640812,22.39,0.547609806061
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,100000,none,0.09,0.955571591854,0.28,0.95091843605,2.91,0.944755911827,17.43,0.934778630733,20.82,0.917374968529,21.67,0.888752698898,21.89,0.844037294388,22.15,0.777474820614,22.23,0.691992640495,22.22,0.607278168201,22.24,0.534005641937
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,0,100000,dropout+label_smoothing,0.25,0.95857834816,0.39,0.952822744846,1.58,0.946046829224,15.61,0.936177909374,20.34,0.919916272163,20.72,0.893891096115,21.03,0.853872179985,21.03,0.792806327343,21.06,0.709286153316,21.07,0.623136520386,21.18,0.547112107277
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,0,100000,label_smoothing,0.05,0.964473128319,0.08,0.960704863071,0.77,0.955714225769,14.35,0.947437167168,20,0.932604491711,21.05,0.908002495766,21.59,0.869108736515,21.75,0.808480501175,21.9,0.727919340134,22.07,0.64861446619,21.98,0.580610096455
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,0,100000,none,0.08,0.961444735527,0.11,0.95774269104,0.78,0.952601373196,15.08,0.943722248077,20.56,0.927756726742,21.3,0.901275992393,21.73,0.85995388031,21.8,0.798743546009,21.77,0.719010055065,21.73,0.63945633173,21.68,0.571474313736
sparse_transformer_variational_dropout,8.88888888889e-8,linear,100000,100000,dropout+label_smoothing,0.14,0.939311981201,0.24,0.930913388729,2.27,0.920635104179,18.56,0.9059497118,21.27,0.883425533772,21.63,0.848746836185,21.93,0.792885005474,21.85,0.709404587746,21.95,0.61210244894,21.84,0.513037621975,21.77,0.419198513031
sparse_transformer_variational_dropout,8.88888888889e-8,linear,100000,100000,label_smoothing,0.03,0.942860424519,0.06,0.936827719212,1.19,0.928705394268,16.25,0.91608518362,20.91,0.895596325397,22.04,0.862410187721,22.57,0.805822312832,22.61,0.721783638,22.71,0.625555932522,22.75,0.528038024902,22.75,0.434893488884
sparse_transformer_variational_dropout,8.88888888889e-8,linear,100000,100000,none,0.06,0.939478814602,0.17,0.933077454567,1.75,0.924369454384,17.06,0.910917758942,21.47,0.889299035072,22.59,0.854794025421,22.71,0.799018263817,22.91,0.716151475906,22.97,0.617875099182,22.97,0.517919540405,23.02,0.423813790083
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,100000,100000,dropout+label_smoothing,0.16,0.941460072994,0.3,0.933628022671,2.32,0.924018144608,18.21,0.910132586956,21.13,0.888296544552,21.73,0.85415905714,22.04,0.798880398273,22.15,0.714876532555,22.16,0.616210222244,22.17,0.516119599342,22.12,0.421638339758
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,100000,100000,label_smoothing,0.05,0.945602715015,0.12,0.940235733986,0.52,0.932977497578,12.64,0.921471953392,20.62,0.902142882347,22.05,0.869911670685,22.46,0.814300239086,22.5,0.729986011982,22.57,0.632568120956,22.59,0.533866465092,22.64,0.43966114521
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,100000,100000,none,0.06,0.942028701305,0.18,0.936129152775,1.56,0.928046584129,17.4,0.915233075619,21.35,0.894349932671,22.08,0.860644578934,22.6,0.805640697479,22.65,0.722812771797,22.51,0.623405992985,22.58,0.522174596786,22.55,0.427115678787
sparse_transformer_variational_dropout,8.88888888889e-8,linear,200000,100000,dropout+label_smoothing,0.19,0.925338327885,0.8,0.916147649288,11.8,0.904022872448,20.6,0.88664484024,21.7,0.860999524593,22.1,0.821954786777,22.27,0.758246123791,22.4,0.671688556671,22.44,0.5732858181,22.41,0.472227066755,22.48,0.375942498446
sparse_transformer_variational_dropout,8.88888888889e-8,linear,200000,100000,label_smoothing,0.1,0.922442018986,0.44,0.916167497635,5.9,0.907097697258,18.86,0.892860114574,21.6,0.870392024517,22.41,0.833430290222,22.69,0.770241856575,22.88,0.684098005295,23.01,0.585773646832,23.11,0.483989089727,23.09,0.386058747768
sparse_transformer_variational_dropout,8.88888888889e-8,linear,200000,100000,none,0.15,0.918119966984,0.9,0.911177277565,12.16,0.901121139526,20.13,0.885783791542,22.02,0.862141430378,22.53,0.824550151825,22.93,0.762665629387,23,0.675792753696,23.14,0.574704527855,23.13,0.470464795828,23.12,0.371900141239
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,200000,100000,dropout+label_smoothing,0.16,0.928718328476,0.64,0.920211553574,10.76,0.908969819546,20.42,0.892537891865,21.68,0.867881298065,22.05,0.829605937004,22.3,0.766104996204,22.39,0.678201258183,22.37,0.577777981758,22.43,0.47455868125,22.4,0.376272290945
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,200000,100000,label_smoothing,0.09,0.926152765751,0.23,0.920544207096,2.85,0.912360727787,17.77,0.899214923382,21.47,0.878004789352,22.31,0.842267811298,22.83,0.779675245285,22.81,0.692614912987,22.93,0.592255353928,22.87,0.487825095654,22.87,0.387228399515
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,200000,100000,none,0.08,0.921983122826,0.42,0.915639460087,7.35,0.906278908253,20.09,0.891634941101,22.03,0.868697404861,22.65,0.831597864628,22.8,0.769707918167,23,0.681407511234,23.01,0.578227221966,23.18,0.471802145243,23.09,0.371285170317
sparse_transformer_variational_dropout,8.88888888889e-8,linear,300000,100000,dropout+label_smoothing,6.29,0.903463542461,18.07,0.893042385578,21.18,0.878722548485,22,0.859107911587,22.36,0.831680119038,22.51,0.789490580559,22.66,0.723123192787,22.73,0.637322247028,22.7,0.540438473225,22.63,0.441159963608,22.68,0.347406178713
sparse_transformer_variational_dropout,8.88888888889e-8,linear,300000,100000,label_smoothing,2.1,0.886802256107,12.68,0.880097925663,19.57,0.869888246059,21.72,0.854675114155,22.45,0.831753134727,22.99,0.793014705181,23.06,0.729397058487,23.1,0.645501792431,23.12,0.549603223801,23.2,0.450569093227,23.18,0.356353223324
sparse_transformer_variational_dropout,8.88888888889e-8,linear,300000,100000,none,4.56,0.876725256443,15.91,0.869348585606,20.2,0.858530938625,22.14,0.842852830887,22.78,0.819612503052,23.1,0.781882464886,23.41,0.720264494419,23.5,0.63631093502,23.49,0.538854897022,23.59,0.438796639442,23.58,0.345131576061
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,300000,100000,dropout+label_smoothing,4.03,0.909615457058,16.79,0.900209248066,20.95,0.887182354927,21.77,0.869022071362,22.14,0.842848837376,22.35,0.801317453384,22.38,0.734158277512,22.42,0.646202147007,22.32,0.546561837196,22.31,0.444640040398,22.32,0.348579794168
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,300000,100000,label_smoothing,0.46,0.894136428833,5.28,0.888060629368,17.99,0.878746747971,21.43,0.864581227303,22.48,0.842599868774,22.7,0.804443478584,23.03,0.740120828152,23.22,0.654312968254,23.17,0.555632472038,23.2,0.453434169292,23.23,0.356107592583
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,300000,100000,none,2.58,0.886551499367,13.7,0.879781424999,20.27,0.869712591171,22.05,0.854856133461,22.78,0.832320690155,23.26,0.794938921928,23.4,0.732507646084,23.48,0.646374046803,23.51,0.54609900713,23.55,0.443025410175,23.56,0.346517831087
sparse_transformer_variational_dropout,8.88888888889e-8,linear,400000,100000,dropout+label_smoothing,22.99,0.821446835995,23.4,0.811379313469,23.61,0.799826204777,23.69,0.785254597664,23.87,0.764327585697,23.91,0.728422403336,23.98,0.669384837151,24.04,0.590481102467,24.08,0.4993930161,24.04,0.406090676785,24.01,0.318878918886
sparse_transformer_variational_dropout,8.88888888889e-8,linear,400000,100000,label_smoothing,22.4,0.747917115688,23.5,0.738935053349,23.86,0.729526877403,24.08,0.718901634216,24.27,0.704105019569,24.54,0.675624191761,24.69,0.624162316322,24.72,0.55151951313,24.78,0.46641716361,24.75,0.379252672195,24.78,0.297940611839
sparse_transformer_variational_dropout,8.88888888889e-8,linear,400000,100000,none,22.91,0.700116276741,23.41,0.689485728741,23.78,0.678769886494,23.85,0.667290985584,23.96,0.652505278587,24.01,0.626816809177,24.04,0.580577969551,24.11,0.513006925583,24.07,0.431878715754,24.12,0.348582834005,24.11,0.271801441908
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,400000,100000,dropout+label_smoothing,21.81,0.85502076149,22.54,0.847106993198,22.85,0.836663246155,23.08,0.821973383427,23.23,0.799695611,23.41,0.760955512524,23.43,0.697950124741,23.46,0.614624798298,23.45,0.519194066525,23.49,0.421415477991,23.45,0.32993003726
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,400000,100000,label_smoothing,20.81,0.803146123886,22.01,0.797232568264,22.7,0.790147840977,23.08,0.780563533306,23.29,0.7649320364,23.38,0.733506500721,23.46,0.677299559116,23.49,0.598817408085,23.66,0.506686329842,23.65,0.411718159914,23.68,0.322536051273
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,400000,100000,none,21.25,0.774829506874,22.16,0.76745647192,22.85,0.759141147137,23.15,0.748888194561,23.53,0.733530938625,23.6,0.704603016376,23.6,0.652205944061,23.72,0.576481997967,23.62,0.485955446959,23.76,0.392677724361,23.73,0.306274175644
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,100000,dropout+label_smoothing,0.61,0.870413661003,13.21,0.851974904537,22.99,0.825658261776,23.96,0.78705072403,24.01,0.733384370804,24.17,0.663701295853,24.16,0.579018294811,24.18,0.483120054007,24.17,0.393056094646,24.2,0.31714001298,24.19,0.254841089249
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,100000,label_smoothing,0.4,0.880720376968,6.45,0.866599202156,21.19,0.844742357731,23.71,0.810616791248,24.31,0.760991752148,24.52,0.694385647774,24.54,0.611185193062,24.7,0.517526865005,24.7,0.431424468756,24.69,0.359247893095,24.7,0.299735039473
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,100000,none,1.57,0.8712849617,14.97,0.857253134251,22.32,0.835031569004,23.77,0.800167858601,24.19,0.749213814735,24.36,0.681459128857,24.48,0.599349379539,24.61,0.507649421692,24.58,0.420518577099,24.58,0.347435593605,24.59,0.287723869085
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,0,100000,dropout+label_smoothing,0.51,0.881281733513,11.55,0.864327132702,22.41,0.839682519436,23.49,0.802990674973,23.86,0.751663863659,24.04,0.685116291046,24.1,0.604595303535,24.09,0.512942552567,24.13,0.42529168725,24.11,0.351910591125,24.12,0.29200771451
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,0,100000,label_smoothing,0.73,0.894801914692,12.51,0.88222193718,22.26,0.861954569817,23.72,0.829618155956,23.97,0.782347381115,24.15,0.719153523445,24.31,0.640705287457,24.31,0.551191449165,24.36,0.467575877905,24.27,0.398261368275,24.33,0.341678589582
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,0,100000,none,1.41,0.887131631374,16.87,0.874336600304,22.21,0.853284835815,23.57,0.81960940361,23.98,0.770349979401,24.26,0.705363035202,24.28,0.627380669117,24.37,0.540466547012,24.44,0.456703096628,24.42,0.38692715764,24.49,0.330476820469
sparse_transformer_variational_dropout,2.22222222222e-8,linear,100000,100000,dropout+label_smoothing,5.85,0.842679738998,21.55,0.819525003433,24.14,0.787941038609,24.51,0.744618475437,24.6,0.686405181885,24.69,0.610901296139,24.77,0.517946302891,24.77,0.421707481146,24.7,0.334612041712,24.68,0.260250091553,24.68,0.199030563235
sparse_transformer_variational_dropout,2.22222222222e-8,linear,100000,100000,label_smoothing,4.78,0.842800855637,18.24,0.823232829571,23.56,0.795258700848,24.55,0.755374670029,24.97,0.699616789818,25.03,0.624675631523,25.07,0.53108805418,25.19,0.434965521097,25.22,0.347970873117,25.21,0.273375451565,25.21,0.211340144277
sparse_transformer_variational_dropout,2.22222222222e-8,linear,100000,100000,none,11.35,0.82287478447,20.72,0.802627503872,23.61,0.774157524109,24.57,0.733573198318,24.98,0.676654875278,25.19,0.601912558079,25.1,0.511236727238,25.24,0.416798233986,25.24,0.330800533295,25.23,0.257614642382,25.23,0.197553947568
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,100000,100000,dropout+label_smoothing,2.65,0.847856581211,20.33,0.82563495636,23.65,0.795041322708,24.37,0.752427220345,24.67,0.694477498531,24.68,0.619133174419,24.7,0.526075959206,24.64,0.428581684828,24.65,0.340039402246,24.68,0.264372199774,24.69,0.202030777931
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,100000,100000,label_smoothing,1.73,0.850228488445,17.26,0.831472814083,23.4,0.804181158543,24.52,0.764724552631,24.98,0.709155023098,24.98,0.634242892265,25.01,0.540420770645,25.05,0.443570196629,24.97,0.355916947126,25.07,0.280841648579,25.05,0.218321725726
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,100000,100000,none,9.13,0.832586944103,20.41,0.813354253769,23.78,0.785605609417,24.62,0.745365977287,24.93,0.688615858555,25.14,0.613618314266,25.21,0.522447645664,25.1,0.426689118147,25.17,0.339381247759,25.17,0.264925211668,25.18,0.203691929579
sparse_transformer_variational_dropout,2.22222222222e-8,linear,200000,100000,dropout+label_smoothing,20.93,0.815386116505,24.18,0.789691269398,24.79,0.756415009499,25.04,0.712421476841,24.99,0.653807580471,25.03,0.576968550682,25.12,0.484660834074,25.14,0.392664372921,25.16,0.309766441584,25.15,0.239237949252,25.12,0.181480273604
sparse_transformer_variational_dropout,2.22222222222e-8,linear,200000,100000,label_smoothing,19.42,0.795797646046,23.24,0.774210333824,24.62,0.745376110077,25.14,0.705766499043,25.42,0.650341629982,25.41,0.574676990509,25.51,0.483178257942,25.5,0.391854792833,25.54,0.309618026018,25.54,0.239798724651,25.56,0.182624697685
sparse_transformer_variational_dropout,2.22222222222e-8,linear,200000,100000,none,20.87,0.758678615093,23.7,0.737134158611,24.85,0.709409952164,25.17,0.671072244644,25.35,0.617113351822,25.49,0.544958114624,25.41,0.458436459303,25.4,0.371173381805,25.38,0.292267620564,25.36,0.225375860929,25.37,0.171154856682
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,200000,100000,dropout+label_smoothing,20.6,0.8229367733,23.72,0.798115968704,24.46,0.765526473522,24.62,0.722086250782,24.83,0.663590073586,24.9,0.586518645287,24.93,0.493440270424,24.94,0.400128275156,24.92,0.315893083811,24.86,0.244075700641,24.86,0.185133114457
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,200000,100000,label_smoothing,17.02,0.808495938778,22.3,0.787500977516,24.18,0.758876383305,24.69,0.71917039156,25.01,0.663495361805,25.01,0.587456226349,25.1,0.494979023933,25.12,0.402441442013,25.11,0.318930119276,25.06,0.247701838613,25.1,0.189126163721
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,200000,100000,none,20.97,0.776925206184,23.65,0.755721926689,24.57,0.727744102478,25.01,0.688604474068,25.09,0.633408248425,25.33,0.559683918953,25.27,0.471238911152,25.27,0.38172441721,25.28,0.300697147846,25.29,0.231980070472,25.3,0.176126122475
sparse_transformer_variational_dropout,2.22222222222e-8,linear,300000,100000,dropout+label_smoothing,24.51,0.764627158642,25.2,0.741452634335,25.29,0.71224540472,25.47,0.672850310802,25.56,0.618233084679,25.61,0.544060707092,25.62,0.456114143133,25.6,0.36891824007,25.58,0.290388286114,25.53,0.223627999425,25.54,0.169213116169
sparse_transformer_variational_dropout,2.22222222222e-8,linear,300000,100000,label_smoothing,24.51,0.684895038605,25.2,0.665892601013,25.44,0.642903029919,25.58,0.610676229,25.79,0.562923312187,25.81,0.494531691074,25.84,0.412990957499,25.82,0.332433342934,25.69,0.260916560888,25.7,0.200959056616,25.71,0.152416959405
sparse_transformer_variational_dropout,2.22222222222e-8,linear,300000,100000,none,24.6,0.612245798111,24.83,0.593762814999,24.86,0.571986019611,25.02,0.541440784931,24.9,0.496564239264,24.98,0.43458995223,24.97,0.361626625061,25,0.289448738098,25.01,0.225284188986,25.04,0.171982854605,25.04,0.129398807883
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,300000,100000,dropout+label_smoothing,24.01,0.780744671822,24.67,0.757125079632,25.07,0.727033674717,25.26,0.686537802219,25.32,0.630613684654,25.45,0.55487960577,25.44,0.465191811323,25.39,0.376260429621,25.38,0.296125501394,25.38,0.228040710092,25.39,0.172477573156
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,300000,100000,label_smoothing,23.62,0.720368802547,24.66,0.700950145721,24.96,0.676633954048,25.07,0.642370402813,25.25,0.59207701683,25.38,0.520828008652,25.21,0.435847967863,25.2,0.351739048958,25.18,0.276562571526,25.24,0.213285729289,25.27,0.161894232035
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,300000,100000,none,24.09,0.658901631832,24.94,0.63940268755,25.11,0.616052985191,25.32,0.583540797234,25.42,0.536069095135,25.43,0.470645904541,25.41,0.39308822155,25.33,0.315902680159,25.4,0.246812090278,25.43,0.189069628716,25.27,0.142678022385
sparse_transformer_variational_dropout,2.22222222222e-8,linear,400000,100000,dropout+label_smoothing,26.45,0.589960038662,26.52,0.578570961952,26.48,0.565403819084,26.54,0.54568862915,26.57,0.512353658676,26.53,0.458100020885,26.54,0.388292849064,26.53,0.316021591425,26.52,0.249368950725,26.55,0.192117601633,26.53,0.145283475518
sparse_transformer_variational_dropout,2.22222222222e-8,linear,400000,100000,label_smoothing,24.6,0.400576263666,24.74,0.391955822706,24.69,0.379792839289,24.75,0.359453052282,24.73,0.326992422342,24.72,0.280704706907,24.72,0.229668259621,24.79,0.182464942336,24.75,0.142031788826,24.76,0.108864761889,24.76,0.0825294330716
sparse_transformer_variational_dropout,2.22222222222e-8,linear,400000,100000,none,22.92,0.335340231657,23,0.326741337776,23.01,0.31352737546,22.95,0.292270898819,22.89,0.261532604694,22.94,0.221908405423,22.83,0.180374369025,22.87,0.143083766103,22.88,0.111800774932,22.88,0.0865866392851,22.86,0.0666953772306
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,400000,100000,dropout+label_smoothing,25.95,0.662702620029,26.11,0.648449003696,26.12,0.630890011787,26.14,0.604656040668,26.16,0.56283468008,26.26,0.499414175749,26.3,0.421175450087,26.29,0.341645419598,26.24,0.269143313169,26.24,0.207264438272,26.21,0.156747832894
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,400000,100000,label_smoothing,25.12,0.494709551334,25.21,0.483528614044,25.3,0.469140589237,25.28,0.446100056171,25.25,0.408824920654,25.3,0.354302346706,25.29,0.291682451963,25.28,0.232336193323,25.34,0.180958196521,25.26,0.138515993953,25.35,0.104518525302
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,400000,100000,none,23.75,0.418273389339,23.93,0.407525092363,23.86,0.392394244671,23.84,0.368355929852,23.76,0.33259254694,23.66,0.28499981761,23.72,0.232954934239,23.66,0.184723377228,23.69,0.14374153316,23.69,0.110515028238,23.69,0.0842902809381
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,200000,dropout+label_smoothing,0.12,0.975886642933,0.11,0.971915125847,0.14,0.96769952774,0.56,0.96264231205,9.19,0.955166220665,18.15,0.942670702934,18.91,0.921697795391,19.11,0.884961724281,19.32,0.821496188641,19.34,0.739573657513,19.39,0.655601084232
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,200000,label_smoothing,0.11,0.978768467903,0,0.975735127926,0,0.972313463688,0.56,0.967885792255,9.92,0.96086448431,17.98,0.948584079742,19.53,0.927455663681,19.83,0.889144957066,20.05,0.824206352234,20.2,0.745314776897,20.25,0.667982876301
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,200000,none,0.09,0.97571003437,0.09,0.972641050816,0.21,0.96912586689,1.86,0.964387178421,15.69,0.956634700298,19.16,0.943138420582,20.21,0.920070111752,20.67,0.880000054836,20.88,0.814463615417,20.85,0.733973145485,20.89,0.655527770519
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,0,200000,dropout+label_smoothing,0.2,0.978952586651,0.2,0.975730717182,0.22,0.972314357758,1.01,0.96806126833,13.71,0.961456179619,18.01,0.950241863728,18.57,0.931550264359,18.74,0.899368286133,18.93,0.842715501785,18.91,0.764542341232,18.89,0.68330848217
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,0,200000,label_smoothing,0.07,0.981772661209,0.07,0.979103207588,0.13,0.975961506367,1.18,0.971764087677,11.92,0.964986264706,17.8,0.953393876553,19.03,0.933868527412,19.5,0.899568796158,19.73,0.840263187885,19.69,0.764162242413,19.84,0.689593732357
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,0,200000,none,0.11,0.979000449181,0.18,0.976633071899,0.76,0.973887205124,4.95,0.970016479492,16.07,0.963366091251,19.13,0.951324164867,19.95,0.930561184883,20.34,0.894415855408,20.53,0.834191739559,20.54,0.756947875023,20.53,0.68105661869
sparse_transformer_variational_dropout,2.22222222222e-7,linear,100000,200000,dropout+label_smoothing,0.1,0.963757634163,0.18,0.959329605103,0.27,0.954259157181,1.62,0.947740852833,15.63,0.937933027744,19,0.921900808811,19.47,0.894197165966,19.69,0.842816948891,19.84,0.767582178116,19.93,0.677763283253,20.03,0.579687058926
sparse_transformer_variational_dropout,2.22222222222e-7,linear,100000,200000,label_smoothing,0,0.964288175106,0,0.961296021938,0,0.957638800144,0.3,0.952552616596,10.03,0.944180488586,18.56,0.929517328739,20.09,0.901817023754,20.4,0.848529398441,20.55,0.772344887257,20.67,0.682111501694,20.69,0.583812952042
sparse_transformer_variational_dropout,2.22222222222e-7,linear,100000,200000,none,0.08,0.962760031223,0.09,0.959423780441,0.22,0.955283463001,1.37,0.949364066124,13,0.939620912075,19.4,0.923024296761,20.82,0.894008934498,21.34,0.841566979885,21.38,0.763499379158,21.44,0.669594585896,21.41,0.568826973438
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,100000,200000,dropout+label_smoothing,0.08,0.967134892941,0.14,0.963325679302,0.21,0.959038436413,0.62,0.953490376472,11.88,0.944833099842,18.76,0.930196225643,19.35,0.904398262501,19.78,0.855464696884,19.83,0.780535042286,19.89,0.689916610718,19.86,0.590742588043
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,100000,200000,label_smoothing,0.04,0.968099892139,0.15,0.965613424778,0.17,0.962517917156,0.8,0.957997918129,10.87,0.950211644173,18.71,0.936384797096,20.1,0.910317122936,20.39,0.858804941177,20.66,0.781921744347,20.68,0.690181910992,20.68,0.589793205261
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,100000,200000,none,0,0.966164171696,0,0.963439464569,0.16,0.960007667542,1.89,0.954904735088,16.9,0.946168124676,19.88,0.931010186672,20.58,0.904159963131,21.02,0.854007422924,21.06,0.775826871395,21.12,0.680019497871,21.16,0.576788187027
sparse_transformer_variational_dropout,2.22222222222e-7,linear,200000,200000,dropout+label_smoothing,0.14,0.951056480408,0.23,0.946488440037,0.6,0.940750837326,9.07,0.932815730572,18.48,0.920886039734,19.59,0.901993274689,20.13,0.867610573769,20.24,0.810332477093,20.35,0.733322143555,20.38,0.64033806324,20.43,0.536538004875
sparse_transformer_variational_dropout,2.22222222222e-7,linear,200000,200000,label_smoothing,0.04,0.94459426403,0.04,0.941829562187,0.1,0.938051104546,1.4,0.932282805443,15.44,0.922608554363,19.72,0.90582972765,20.87,0.872004210949,21.22,0.814925909042,21.32,0.738287389278,21.38,0.645020246506,21.36,0.539559066296
sparse_transformer_variational_dropout,2.22222222222e-7,linear,200000,200000,none,0.11,0.943322300911,0.15,0.940213978291,0.37,0.93589425087,3.62,0.929321885109,17.45,0.918607592583,20.47,0.900798082352,21.07,0.868260204792,21.55,0.811917960644,21.64,0.731870293617,21.74,0.633104324341,21.76,0.523881852627
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,200000,200000,dropout+label_smoothing,0.13,0.955823481083,0.21,0.952094018459,0.37,0.947460949421,3.29,0.940907895565,17.33,0.930567860603,19.13,0.913549184799,19.55,0.881661057472,19.68,0.825182855129,19.78,0.746599316597,19.88,0.650213062763,19.87,0.541694819927
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,200000,200000,label_smoothing,0.09,0.949907779694,0.17,0.947773635387,0.28,0.944827377796,0.89,0.9401268363,11.22,0.931762516499,19.2,0.91649132967,20.49,0.884545266628,20.75,0.827394902706,21.04,0.748035013676,21.06,0.64980006218,21.16,0.538326621056
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,200000,200000,none,0.04,0.948647260666,0.05,0.946239113808,0.14,0.942833840847,2.04,0.937357902527,16.17,0.92792314291,20.22,0.911642074585,21.12,0.881010353565,21.33,0.825339317322,21.51,0.743544518948,21.53,0.640870511532,21.56,0.526166200638
sparse_transformer_variational_dropout,2.22222222222e-7,linear,300000,200000,dropout+label_smoothing,0.73,0.929882884026,4.43,0.92492890358,16.6,0.917887568474,19.49,0.907887339592,20.28,0.89378619194,20.66,0.872044026852,20.73,0.832962453365,20.84,0.774384737015,20.9,0.69762724638,20.85,0.604905068874,20.82,0.50197416544
sparse_transformer_variational_dropout,2.22222222222e-7,linear,300000,200000,label_smoothing,0.18,0.91165882349,0.83,0.908835947514,8.7,0.904373645782,18.08,0.897299528122,20.28,0.88637393713,21.07,0.867432713509,21.55,0.830774366856,21.75,0.774779260159,21.89,0.700466871262,21.81,0.609413325787,21.78,0.506729602814
sparse_transformer_variational_dropout,2.22222222222e-7,linear,300000,200000,none,0.3,0.907032430172,2.12,0.903947949409,13.37,0.89909863472,18.83,0.891574382782,20.77,0.880199432373,21.44,0.861796915531,21.83,0.827919900417,22.04,0.773096978664,22.18,0.69636875391,22.2,0.601173043251,22.12,0.495585978031
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,300000,200000,dropout+label_smoothing,0.43,0.940074682236,1.39,0.936198651791,11.85,0.930856108665,18.45,0.92298668623,19.68,0.911182761192,20.03,0.891917824745,20.1,0.854972600937,20.28,0.796612381935,20.31,0.717933297157,20.31,0.6207280159,20.35,0.511195600033
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,300000,200000,label_smoothing,0.12,0.922936737537,0.25,0.92068862915,1.6,0.917260408401,12.54,0.911713957787,19.44,0.902669966221,20.77,0.886110603809,21.26,0.851542294025,21.45,0.795888721943,21.52,0.719655036926,21.48,0.623806595802,21.51,0.513990938663
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,300000,200000,none,0.11,0.920384347439,0.37,0.918032407761,3.52,0.914358556271,15.38,0.908349335194,19.85,0.898678839207,21.1,0.882028579712,21.66,0.849618017673,21.93,0.794294536114,21.94,0.714485168457,22.02,0.613430440426,22.02,0.500206530094
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,200000,dropout+label_smoothing,0.12,0.967357158661,0.18,0.9620423913,0.29,0.956237077713,2.37,0.948835432529,16.47,0.937466740608,19.27,0.9189915061,19.68,0.889269828796,19.93,0.839233517647,20.1,0.762173771858,20.12,0.674242079258,20.11,0.589444816113
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,200000,label_smoothing,0,0.971000671387,0.32,0.967275679111,0.57,0.962934553623,5.62,0.956847906113,17.4,0.946628510952,20.02,0.929205417633,20.83,0.900032401085,21.07,0.849107503891,21.07,0.773068904877,21.15,0.691186487675,21.15,0.614907681942
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,200000,none,0.09,0.967408716679,0.18,0.963408052921,0.76,0.958679616451,8.88,0.951947748661,18.81,0.940673947334,20.62,0.921594023705,21.1,0.889963626862,21.22,0.837681472301,21.4,0.760668635368,21.5,0.675662577152,21.47,0.597299873829
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,0,200000,dropout+label_smoothing,0.11,0.97136169672,0.13,0.967067956924,0.2,0.962384819984,2.33,0.95627373457,17.1,0.946558117867,19.19,0.930334806442,19.68,0.903884530067,19.82,0.859705686569,19.94,0.788842558861,19.87,0.703339934349,19.95,0.621159493923
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,0,200000,label_smoothing,0.13,0.97470843792,0.15,0.971600413322,0.2,0.967915773392,4.67,0.96263307333,16.42,0.953547000885,19.55,0.937757015228,20.38,0.911374509335,20.55,0.865950644016,20.72,0.79490673542,20.82,0.714707374573,20.91,0.641024827957
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,0,200000,none,0.06,0.971948027611,0.09,0.969046354294,0.28,0.965511381626,5.23,0.960208952427,18.57,0.9508228302,20.24,0.934292256832,20.77,0.906448543072,20.83,0.860013723373,20.83,0.789254784584,20.96,0.707593083382,20.95,0.632169425488
sparse_transformer_variational_dropout,1.55555555556e-7,linear,100000,200000,dropout+label_smoothing,0.11,0.954584360123,0.12,0.948551356792,0.32,0.941507160664,4.66,0.932139098644,18.68,0.917847335339,20.27,0.895125448704,20.67,0.856799185276,20.85,0.791678309441,20.9,0.705831348896,20.92,0.609893023968,20.97,0.51134955883
sparse_transformer_variational_dropout,1.55555555556e-7,linear,100000,200000,label_smoothing,0.05,0.956006586552,0.08,0.951844632626,0.1,0.946592569351,0.9,0.938948631287,14.29,0.926308214664,20.32,0.90506875515,21.27,0.866406261921,21.51,0.799776136875,21.69,0.713611841202,21.7,0.618287742138,21.69,0.520250916481
sparse_transformer_variational_dropout,1.55555555556e-7,linear,100000,200000,none,0,0.953710317612,0.06,0.949134409428,0.26,0.943312466145,5.82,0.934773027897,17.98,0.920967936516,20.7,0.898331284523,21.65,0.859841406345,21.93,0.795091331005,22.03,0.707536578178,22.24,0.609338700771,22.32,0.509377360344
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,100000,200000,dropout+label_smoothing,0.12,0.958271980286,0.18,0.953041255474,0.36,0.946942031384,3.14,0.938685536385,18.48,0.925690829754,19.91,0.904450654984,20.39,0.868140280247,20.7,0.804717838764,20.72,0.718313336372,20.69,0.621310949326,20.68,0.521660506725
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,100000,200000,label_smoothing,0,0.960150778294,0,0.956601321697,0.12,0.952104747295,1.5,0.945414841175,16.41,0.933997929096,20.34,0.914193093777,21.15,0.877652049065,21.47,0.812290906906,21.39,0.725263237953,21.55,0.628394424915,21.6,0.528701007366
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,100000,200000,none,0.07,0.957700371742,0.1,0.953874707222,0.26,0.948958754539,3.88,0.941508412361,18.39,0.928911447525,20.89,0.907657980919,21.45,0.870860159397,21.7,0.80724465847,21.85,0.718394398689,21.8,0.617711544037,21.84,0.515454649925
sparse_transformer_variational_dropout,1.55555555556e-7,linear,200000,200000,dropout+label_smoothing,0.12,0.940994739532,0.31,0.934577524662,2.72,0.926366567612,17.47,0.914873182774,20.05,0.897890210152,20.69,0.871858298779,20.96,0.826384067535,21,0.757252335548,21.07,0.670525252819,21.06,0.572451412678,21.03,0.470050126314
sparse_transformer_variational_dropout,1.55555555556e-7,linear,200000,200000,label_smoothing,0.08,0.935475289822,0.1,0.9313108325,0.49,0.92549353838,8.98,0.916594028473,18.84,0.902291238308,20.85,0.878213882446,21.56,0.832954108715,21.86,0.763843536377,22.02,0.676841259003,22.07,0.57781624794,22.18,0.473554044962
sparse_transformer_variational_dropout,1.55555555556e-7,linear,200000,200000,none,0,0.93288487196,0.12,0.928248882294,1.88,0.921703219414,13.68,0.911688745022,20.03,0.895958065987,21.82,0.870751559734,22.24,0.826739728451,22.34,0.757414221764,22.23,0.667224764824,22.34,0.564374983311,22.32,0.45832028985
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,200000,200000,dropout+label_smoothing,0.23,0.946230530739,0.34,0.940893173218,1.04,0.934104144573,12.57,0.924399554729,19.59,0.909330666065,20.63,0.885221123695,20.82,0.841884195805,21.02,0.772733867168,20.94,0.684125423431,20.94,0.582731127739,21,0.476361274719
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,200000,200000,label_smoothing,0.04,0.941397607327,0.04,0.938176512718,0.16,0.933633804321,3.58,0.926336765289,18.14,0.913856089115,20.66,0.89197319746,21.4,0.849057018757,21.74,0.779897212982,21.92,0.690633773804,21.95,0.587624251842,21.9,0.478515654802
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,200000,200000,none,0.09,0.939291298389,0.12,0.935629665852,1.23,0.930357575417,13.29,0.921876966953,20.09,0.907920897007,21.43,0.884715020657,21.96,0.842718720436,21.99,0.773426830769,22.05,0.680874586105,22.07,0.57408452034,22.13,0.463368058205
sparse_transformer_variational_dropout,1.55555555556e-7,linear,300000,200000,dropout+label_smoothing,4.52,0.91659873724,14.9,0.909415841103,19.68,0.899299383163,20.78,0.88550901413,21.29,0.866579413414,21.61,0.837701618671,21.78,0.788569629192,21.89,0.7192684412,21.86,0.63336366415,21.87,0.536305367947,21.94,0.435936659575
sparse_transformer_variational_dropout,1.55555555556e-7,linear,300000,200000,label_smoothing,0.36,0.897051751614,3.38,0.892698347569,16,0.885954320431,20.4,0.87577688694,21.61,0.860631525517,22.29,0.835005164146,22.65,0.788777649403,22.81,0.721858918667,22.89,0.637634396553,22.88,0.541388511658,23.01,0.440799355507
sparse_transformer_variational_dropout,1.55555555556e-7,linear,300000,200000,none,2.47,0.889697790146,10.67,0.884826481342,18.71,0.877575278282,20.76,0.866975128651,21.82,0.851572930813,22.35,0.826842188835,22.61,0.783344984055,22.65,0.717305541039,22.72,0.631052970886,22.73,0.532187283039,22.8,0.430532425642
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,300000,200000,dropout+label_smoothing,0.46,0.928898870945,3.67,0.923106491566,17.25,0.914984107018,20.17,0.903309643269,20.72,0.886307656765,21.26,0.858977615833,21.33,0.810339987278,21.44,0.739849448204,21.45,0.651114046574,21.53,0.549777746201,21.54,0.444168359041
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,300000,200000,label_smoothing,0.17,0.912014305592,0.98,0.908627033234,10.17,0.903345763683,18.98,0.894949436188,21.04,0.881594836712,21.8,0.857674777508,22.11,0.81221473217,22.22,0.744448781013,22.32,0.657417178154,22.34,0.556221485138,22.34,0.44931614399
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,300000,200000,none,0.38,0.908322453499,2.57,0.904682695866,13.31,0.898983478546,19.64,0.889961659908,21.39,0.875953376293,22,0.85233694315,22.26,0.809000194073,22.34,0.741075217724,22.56,0.650898516178,22.55,0.54633140564,22.55,0.438074946404
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,200000,dropout+label_smoothing,0.18,0.94805508852,0.37,0.940014898777,0.97,0.930761277676,16.83,0.918028235435,20.61,0.898190319538,21.41,0.867391705513,21.6,0.820378661156,21.72,0.748086512089,21.8,0.655252039433,21.84,0.562744379044,21.84,0.47874724865
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,200000,label_smoothing,0,0.953642189503,0.11,0.947730302811,0.73,0.940438985825,9.92,0.929533720016,20.07,0.911447584629,21.56,0.882274746895,22.18,0.835921406746,22.33,0.763778448105,22.43,0.675047576427,22.49,0.589859843254,22.46,0.51402592659
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,200000,none,0,0.949262738228,0.2,0.943381369114,2.93,0.935891807079,18.05,0.924505531788,21.21,0.90539932251,22.19,0.874538600445,22.58,0.82667529583,22.75,0.755803585052,22.99,0.667169988155,22.88,0.58090621233,22.94,0.505178153515
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,0,200000,dropout+label_smoothing,0.15,0.953997850418,0.19,0.947262465954,1.18,0.939412236214,16.01,0.928258836269,20.24,0.910399794579,20.92,0.882199704647,21.13,0.838946342468,21.18,0.772719323635,21.16,0.6840736866,21.16,0.59422147274,21.19,0.514054834843
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,0,200000,label_smoothing,0,0.960173428059,0.12,0.95569396019,1.33,0.949977040291,14.41,0.940903067589,20.4,0.925141274929,21.43,0.899114072323,21.73,0.857672035694,21.8,0.792600989342,21.88,0.708147227764,22.02,0.626314043999,21.95,0.555070340633
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,0,200000,none,0.05,0.956577718258,0.09,0.952100515366,1,0.946202456951,15.11,0.93660312891,21.22,0.919804394245,22.02,0.891977548599,22.44,0.84840720892,22.62,0.783487975597,22.64,0.699165701866,22.57,0.614987552166,22.61,0.542189896107
sparse_transformer_variational_dropout,8.88888888889e-8,linear,100000,200000,dropout+label_smoothing,0.15,0.934470057487,0.32,0.925020933151,4.17,0.913456082344,19.5,0.89724701643,21.49,0.873001158237,21.97,0.836399972439,22.23,0.778149306774,22.23,0.693871259689,22.21,0.597504198551,22.17,0.499733477831,22.15,0.407312422991
sparse_transformer_variational_dropout,8.88888888889e-8,linear,100000,200000,label_smoothing,0,0.937274515629,0.14,0.930339574814,1.36,0.921124815941,15.15,0.907116889954,20.78,0.884903609753,21.94,0.849507331848,22.43,0.790142118931,22.57,0.705565989017,22.77,0.610433161259,22.79,0.514129459858,22.81,0.422312557697
sparse_transformer_variational_dropout,8.88888888889e-8,linear,100000,200000,none,0.08,0.93303155899,0.25,0.925472736359,4.19,0.915388405323,18.62,0.90026050806,21.8,0.87698251009,22.51,0.840817272663,22.93,0.783273398876,22.94,0.699687600136,23.04,0.602315068245,23.06,0.503486037254,23.13,0.410338163376
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,100000,200000,dropout+label_smoothing,0.11,0.938991844654,0.25,0.930623948574,2,0.920388102531,18.56,0.905833184719,21.25,0.883334517479,21.76,0.848563611507,22.01,0.792442560196,22.1,0.708600223064,22.23,0.611194431782,22.19,0.512236595154,22.16,0.41854429245
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,100000,200000,label_smoothing,0.05,0.943049132824,0.11,0.937089920044,0.58,0.929077148438,13.02,0.916536152363,20.8,0.896040320396,22.08,0.86262768507,22.64,0.805662930012,22.83,0.7212266922,22.85,0.624932408333,22.92,0.527447223663,22.91,0.434700995684
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,100000,200000,none,0.06,0.939034044743,0.19,0.932675123215,1.47,0.924107193947,17.65,0.910803973675,21.2,0.889368474483,22.31,0.855055093765,22.84,0.799507379532,23.05,0.716546356678,22.99,0.617885112762,23.07,0.517486274242,23.07,0.423010617495
sparse_transformer_variational_dropout,8.88888888889e-8,linear,200000,200000,dropout+label_smoothing,0.35,0.918338894844,1.58,0.907599210739,15.63,0.893575191498,21.23,0.874180734158,22.12,0.84679877758,22.38,0.806121170521,22.58,0.741234540939,22.6,0.655323326588,22.59,0.558474123478,22.64,0.459506213665,22.66,0.365503966808
sparse_transformer_variational_dropout,8.88888888889e-8,linear,200000,200000,label_smoothing,0.17,0.913719773293,0.86,0.906065046787,11.04,0.895113050938,19.75,0.878733098507,21.97,0.854234099388,22.55,0.815330266953,22.69,0.750894725323,22.95,0.665461242199,22.97,0.568943321705,23.01,0.469868212938,22.99,0.375034302473
sparse_transformer_variational_dropout,8.88888888889e-8,linear,200000,200000,none,0.12,0.907579183578,0.94,0.89912122488,14.66,0.887092530727,20.86,0.86960619688,22.47,0.843988776207,23.12,0.804552733898,23.19,0.741528749466,23.25,0.655343651772,23.17,0.556442379951,23.23,0.455328851938,23.23,0.360179662704
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,200000,200000,dropout+label_smoothing,0.3,0.925338685513,1.19,0.916131496429,14.84,0.903986752033,21,0.886593520641,21.99,0.860998094082,22.58,0.821913003922,22.62,0.758100569248,22.73,0.671186745167,22.72,0.572533428669,22.72,0.471161454916,22.67,0.37476810813
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,200000,200000,label_smoothing,0,0.922278642654,0.2,0.916066110134,4.04,0.907059669495,17.41,0.893008470535,21.39,0.870860517025,22.39,0.83442735672,22.66,0.771478295326,22.76,0.685462653637,22.78,0.586936175823,22.74,0.484798282385,22.74,0.386560082436
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,200000,200000,none,0.14,0.91756862402,1.08,0.910567641258,11.06,0.900397479534,20,0.884812772274,22.08,0.860984742641,22.71,0.823223531246,23.01,0.761095583439,23.18,0.673795044422,23.13,0.572232544422,23.27,0.467716127634,23.3,0.369058847427
sparse_transformer_variational_dropout,8.88888888889e-8,linear,300000,200000,dropout+label_smoothing,14.22,0.884540736675,20.68,0.872508704662,21.99,0.856502234936,22.55,0.835735619068,22.86,0.807879388332,23.04,0.765786707401,23.24,0.700429618359,23.16,0.616638243198,23.26,0.522412598133,23.29,0.426478326321,23.26,0.336538821459
sparse_transformer_variational_dropout,8.88888888889e-8,linear,300000,200000,label_smoothing,8.92,0.860337853432,18.5,0.851782977581,21.19,0.839960753918,22.47,0.823655843735,22.97,0.800185263157,23.42,0.761509358883,23.63,0.698957443237,23.85,0.617177546024,23.92,0.524400174618,23.96,0.429842233658,23.89,0.340882062912
sparse_transformer_variational_dropout,8.88888888889e-8,linear,300000,200000,none,14.6,0.84109300375,20.51,0.831154644489,22.09,0.818544149399,22.88,0.802288353443,23.48,0.77963757515,23.51,0.743510782719,23.67,0.684455752373,23.75,0.603761076927,23.74,0.510105729103,23.84,0.414301395416,23.8,0.325328141451
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,300000,200000,dropout+label_smoothing,5.3,0.903945624828,17.93,0.893617808819,21.17,0.879477798939,22.13,0.860239923,22.41,0.833273112774,22.47,0.791351497173,22.5,0.724921762943,22.53,0.639001369476,22.58,0.541853606701,22.48,0.442413598299,22.48,0.348499715328
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,300000,200000,label_smoothing,1.88,0.886896371841,11.69,0.880061149597,19.76,0.869764268398,21.95,0.854511022568,22.8,0.83137691021,23.25,0.792330265045,23.32,0.728150188923,23.32,0.643669307232,23.36,0.547231793404,23.43,0.447684466839,23.38,0.353165358305
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,300000,200000,none,2.79,0.876834511757,13.1,0.869387209415,20.01,0.858504652977,22.35,0.842862486839,22.99,0.819758892059,23.4,0.782143473625,23.47,0.720315694809,23.48,0.63579082489,23.57,0.537719666958,23.59,0.437051743269,23.6,0.342917054892
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,200000,dropout+label_smoothing,0.92,0.857601106167,17.02,0.837008237839,23.29,0.808384478092,24.17,0.767549574375,24.44,0.711572170258,24.67,0.639451742172,24.63,0.552017092705,24.69,0.454792737961,24.63,0.364845067263,24.65,0.288924843073,24.69,0.226447612047
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,200000,label_smoothing,1.59,0.863357961178,15.35,0.846841812134,22.58,0.822279155254,24.38,0.785619914532,24.88,0.733470201492,25.03,0.66379982233,25.07,0.576759636402,25.05,0.480598658323,25.09,0.393161207438,25.09,0.319290041924,25,0.257915735245
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,200000,none,1.12,0.850210726261,15.48,0.833566725254,22.94,0.808739840984,24.4,0.771360874176,24.87,0.717847108841,24.97,0.647235631943,25.22,0.56208217144,25.16,0.468401223421,25.09,0.381271451712,25.18,0.308055728674,25.2,0.248223274946
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,0,200000,dropout+label_smoothing,0.81,0.872429609299,14.41,0.854323327541,22.66,0.828438997269,23.76,0.790361225605,24.03,0.737351834774,24.18,0.668446600437,24.19,0.584826171398,24.26,0.490048140287,24.17,0.400551140308,24.18,0.325233191252,24.2,0.263460874557
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,0,200000,label_smoothing,0.98,0.883359014988,12.41,0.869441509247,21.69,0.8478038311,23.6,0.814012944698,24.2,0.764841735363,24.5,0.698812365532,24.52,0.616511702538,24.54,0.523490190506,24.58,0.437646627426,24.5,0.365974515676,24.53,0.307051360607
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,0,200000,none,0.73,0.874017894268,12.08,0.860415279865,21.8,0.838624954224,23.7,0.803917527199,24.22,0.753031790257,24.38,0.685704112053,24.45,0.604372859001,24.55,0.513648033142,24.54,0.427038490772,24.52,0.354551851749,24.44,0.295630156994
sparse_transformer_variational_dropout,2.22222222222e-8,linear,100000,200000,dropout+label_smoothing,10.84,0.831079602242,22.5,0.806061983109,24.2,0.77294844389,24.67,0.728753089905,24.84,0.670165896416,24.86,0.594693660736,24.84,0.502508342266,24.87,0.408017337322,24.81,0.322688579559,24.8,0.249975159764,24.81,0.190268680453
sparse_transformer_variational_dropout,2.22222222222e-8,linear,100000,200000,label_smoothing,12.06,0.824150264263,21.43,0.802502453327,23.73,0.772815346718,24.69,0.731922388077,25,0.675682127476,25.11,0.600714564323,25.06,0.508331179619,25.09,0.414590954781,25.05,0.329961687326,25.08,0.257743239403,25.04,0.198084816337
sparse_transformer_variational_dropout,2.22222222222e-8,linear,100000,200000,none,16.27,0.797360181808,21.97,0.775567829609,24.03,0.746281981468,24.57,0.705712854862,24.78,0.649438381195,24.98,0.575687468052,24.92,0.48682513833,24.99,0.39547175169,24.98,0.312684983015,24.97,0.242334112525,24.94,0.184876650572
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,100000,200000,dropout+label_smoothing,3.52,0.842599451542,21.12,0.819359719753,23.98,0.787715733051,24.42,0.744356930256,24.65,0.686125576496,24.66,0.610565900803,24.69,0.517749011517,24.68,0.421319186687,24.83,0.334036827087,24.77,0.259550213814,24.78,0.198235720396
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,100000,200000,label_smoothing,3.17,0.842521011829,17.71,0.822733938694,23.04,0.794494986534,24.33,0.754336714745,24.75,0.698157310486,24.89,0.62284475565,25.07,0.528916478157,25.06,0.432546794415,25.13,0.345417022705,25.08,0.27097594738,25.1,0.209116622806
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,100000,200000,none,7.39,0.822305500507,20.53,0.802177071571,23.92,0.773653328419,24.71,0.732865452766,25.13,0.675757706165,25.24,0.60072261095,25.16,0.509871304035,25.33,0.415082812309,25.36,0.328915268183,25.3,0.255538016558,25.35,0.195273756981
sparse_transformer_variational_dropout,2.22222222222e-8,linear,200000,200000,dropout+label_smoothing,22.99,0.796274840832,24.53,0.770045161247,25.04,0.737013220787,25.1,0.693920254707,25.21,0.636463224888,25.35,0.56093364954,25.39,0.470512032509,25.34,0.380675345659,25.31,0.299898296595,25.28,0.231170907617,25.34,0.175108030438
sparse_transformer_variational_dropout,2.22222222222e-8,linear,200000,200000,label_smoothing,22.25,0.755941927433,24.01,0.733748376369,24.95,0.705672979355,25.27,0.667606949806,25.39,0.614356637001,25.54,0.541414856911,25.6,0.453813970089,25.62,0.366922289133,25.64,0.289120495319,25.67,0.223554581404,25.69,0.170114383101
sparse_transformer_variational_dropout,2.22222222222e-8,linear,200000,200000,none,23.18,0.703182220459,24.34,0.681478023529,24.83,0.65527677536,25.1,0.6196372509,25.22,0.569209933281,25.26,0.50116944313,25.34,0.419811278582,25.34,0.338473945856,25.28,0.265296131372,25.3,0.203783705831,25.31,0.15424926579
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,200000,200000,dropout+label_smoothing,21.65,0.81526196003,24.06,0.789654612541,24.97,0.756491959095,25.32,0.712760865688,25.36,0.654308378696,25.42,0.577589154243,25.43,0.485329300165,25.46,0.393237680197,25.5,0.310117930174,25.51,0.23932094872,25.47,0.181375086308
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,200000,200000,label_smoothing,19.33,0.795756220818,23.11,0.774313986301,24.5,0.745612561703,25.14,0.706016838551,25.34,0.650759994984,25.51,0.575501859188,25.56,0.484519004822,25.58,0.393772810698,25.51,0.311905920506,25.54,0.242345064878,25.54,0.185336410999
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,200000,200000,none,20.45,0.757107019424,23.33,0.73539441824,24.41,0.707487404346,24.91,0.66904515028,24.94,0.614998579025,25.14,0.542688250542,25.05,0.455966800451,25.08,0.368592023849,25.1,0.289652645588,25.07,0.222841367126,25.06,0.168646737933
sparse_transformer_variational_dropout,2.22222222222e-8,linear,300000,200000,dropout+label_smoothing,25.63,0.707429409027,25.82,0.688003599644,25.95,0.66466653347,25.96,0.63249874115,25.95,0.585432529449,25.93,0.517961978912,25.94,0.435707718134,26,0.352898329496,26.02,0.277790009975,26.03,0.213953256607,26.04,0.161937490106
sparse_transformer_variational_dropout,2.22222222222e-8,linear,300000,200000,label_smoothing,25.23,0.569544494152,25.34,0.553877592087,25.41,0.535616874695,25.55,0.509423136711,25.47,0.469079375267,25.49,0.409854114056,25.55,0.339700609446,25.57,0.271539479494,25.49,0.211921706796,25.49,0.162473216653,25.49,0.122732684016
sparse_transformer_variational_dropout,2.22222222222e-8,linear,300000,200000,none,24.45,0.48943015933,24.36,0.475115865469,24.37,0.457518994808,24.48,0.431640684605,24.56,0.393237411976,24.52,0.340758889914,24.47,0.280902028084,24.46,0.223722800612,24.47,0.17429934442,24.47,0.133967265487,24.49,0.102013327181
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,300000,200000,dropout+label_smoothing,24.87,0.763625383377,25.4,0.740576684475,25.61,0.71135443449,25.66,0.671855211258,25.66,0.61694586277,25.7,0.542274057865,25.67,0.454051345587,25.62,0.366699337959,25.66,0.288194894791,25.65,0.221791043878,25.69,0.16770388186
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,300000,200000,label_smoothing,24.26,0.685510218143,24.95,0.666497886181,25.15,0.643516659737,25.3,0.611433029175,25.36,0.563915491104,25.47,0.495877504349,25.38,0.414674460888,25.4,0.334418088198,25.34,0.263060927391,25.35,0.203222021461,25.35,0.154756709933
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,300000,200000,none,24.02,0.613601028919,24.39,0.595009982586,24.43,0.573089301586,24.59,0.542506158352,24.69,0.497676491737,24.65,0.435935020447,24.63,0.363316893578,24.59,0.291522920132,24.59,0.227716803551,24.52,0.174736082554,24.51,0.132419124246
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,300000,dropout+label_smoothing,0.14,0.973820924759,0.13,0.969300270081,0.21,0.964470088482,0.68,0.95869320631,9.63,0.950367391109,18.26,0.936807513237,19.12,0.914394140244,19.36,0.874761879444,19.36,0.807913482189,19.39,0.725023627281,19.46,0.640460968018
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,300000,label_smoothing,0.1,0.976145505905,0.1,0.972773253918,0.05,0.968942403793,0.37,0.964009225368,10.01,0.956329107285,18.71,0.943241715431,19.86,0.920801758766,20.39,0.879614770412,20.61,0.811792135239,20.74,0.732246160507,20.74,0.6541903615
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,300000,none,0,0.973052442074,0.11,0.969623804092,0.22,0.965717256069,1.63,0.960549175739,15.3,0.952226698399,19.41,0.937853693962,20.27,0.913313210011,20.63,0.8707498312,20.7,0.80257499218,20.67,0.721341371536,20.79,0.642461836338
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,0,300000,dropout+label_smoothing,0.13,0.977482497692,0.17,0.973924815655,0.16,0.970174133778,0.46,0.965593695641,10.26,0.958737790585,18.27,0.947089314461,18.88,0.927505612373,19.08,0.893434345722,19.17,0.833797097206,19.15,0.754025161266,19.15,0.671866118908
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,0,300000,label_smoothing,0.04,0.979995667934,0.05,0.977497220039,0.03,0.974640965462,0.29,0.970810472965,7.28,0.964436650276,17.67,0.953012228012,19.49,0.933412730694,19.74,0.898155212402,19.91,0.837118387222,20.12,0.760461270809,20.16,0.685554027557
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,0,300000,none,0.12,0.97732681036,0.12,0.974509894848,0.1,0.971295654774,1.06,0.966900527477,14.87,0.959536194801,19.24,0.946607232094,19.97,0.924576342106,20.57,0.88650739193,20.61,0.823691546917,20.72,0.744538366795,20.86,0.667255938053
sparse_transformer_variational_dropout,2.22222222222e-7,linear,100000,300000,dropout+label_smoothing,0.09,0.961119413376,0.16,0.95603877306,0.25,0.950217783451,1.27,0.942755639553,16.29,0.931769013405,19.43,0.914388895035,19.88,0.884691655636,19.96,0.831150352955,20.18,0.755496740341,20.19,0.666085958481,20.26,0.568993151188
sparse_transformer_variational_dropout,2.22222222222e-7,linear,100000,300000,label_smoothing,0.04,0.961057841778,0.07,0.957548141479,0.07,0.95326089859,1.96,0.947313666344,14.35,0.937875509262,19.11,0.921857595444,20.16,0.891879141331,20.79,0.836524128914,20.93,0.760503351688,20.84,0.671799063683,20.81,0.575645506382
sparse_transformer_variational_dropout,2.22222222222e-7,linear,100000,300000,none,0.05,0.958880364895,0.07,0.955073237419,0.19,0.950373411179,1.4,0.943738222122,16.23,0.933205902576,19.92,0.915892243385,20.98,0.886017501354,21.37,0.83266723156,21.43,0.754985570908,21.54,0.662177026272,21.55,0.562564432621
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,100000,300000,dropout+label_smoothing,0.09,0.965478599072,0.19,0.961401462555,0.36,0.956784129143,1.1,0.950843036175,12.73,0.941822350025,18.69,0.926663339138,19.62,0.900052607059,19.9,0.849946975708,20.01,0.774765431881,20.11,0.684437453747,20.05,0.585758268833
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,100000,300000,label_smoothing,0.04,0.966225743294,0.05,0.963504135609,0.12,0.960125744343,1.16,0.955253005028,14.47,0.947050452232,19.21,0.932697474957,20.13,0.905895471573,20.44,0.853432059288,20.79,0.776481091976,20.82,0.685250818729,20.86,0.585824906826
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,100000,300000,none,0.03,0.964491844177,0.04,0.961449921131,0.07,0.957704782486,1.25,0.952325701714,14.25,0.943360984325,19.39,0.927802741528,20.62,0.900230050087,20.93,0.849405646324,21.09,0.771502315998,21.19,0.676482796669,21.2,0.574156165123
sparse_transformer_variational_dropout,2.22222222222e-7,linear,200000,300000,dropout+label_smoothing,0.1,0.945888996124,0.22,0.940551400185,0.75,0.933788716793,12.44,0.924574017525,19.09,0.911173343658,20.06,0.890807271004,20.55,0.854570448399,20.61,0.796390354633,20.65,0.719516038895,20.67,0.62742638588,20.71,0.525476515293
sparse_transformer_variational_dropout,2.22222222222e-7,linear,200000,300000,label_smoothing,0.05,0.939060389996,0.06,0.93570125103,0.37,0.931059479713,7.61,0.924107372761,18.49,0.913082182407,20.49,0.894743204117,21.24,0.858938992023,21.53,0.801092624664,21.66,0.724920868874,21.6,0.633478522301,21.77,0.53127348423
sparse_transformer_variational_dropout,2.22222222222e-7,linear,200000,300000,none,0.08,0.936432421207,0.1,0.932803452015,0.42,0.927727341652,8.93,0.920099973679,18.99,0.90822327137,20.98,0.889358818531,21.68,0.855823516846,21.84,0.799662649632,22.08,0.721481323242,22.18,0.625955939293,22.14,0.520369589329
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,200000,300000,dropout+label_smoothing,0.13,0.953574955463,0.2,0.949516534805,0.43,0.944450557232,4.98,0.937396168709,18.13,0.926441192627,19.62,0.908657133579,20.13,0.875758528709,20.2,0.819016337395,20.27,0.741468429565,20.29,0.646751224995,20.28,0.5403200984
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,200000,300000,label_smoothing,0.04,0.947403728962,0.05,0.944988131523,0.11,0.941706418991,0.88,0.936617970467,12.69,0.92783755064,19.55,0.911999285221,20.64,0.879415392876,21.07,0.822619378567,21.17,0.744834899902,21.31,0.649202764034,21.45,0.54052323103
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,200000,300000,none,0,0.946064949036,0.14,0.943382561207,0.64,0.939625263214,6.96,0.933768928051,17.69,0.923860371113,20.26,0.906895518303,21.06,0.875197350979,21.31,0.818918764591,21.56,0.737753689289,21.56,0.636979937553,21.46,0.524919867516
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,300000,dropout+label_smoothing,0.13,0.964269578457,0.14,0.958219647408,0.36,0.951625823975,2.41,0.943324148655,17.66,0.930914282799,19.91,0.911140561104,20.33,0.879416286945,20.44,0.825906693935,20.54,0.745877385139,20.43,0.657055795193,20.52,0.570997595787
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,300000,label_smoothing,0.06,0.967939794064,0.04,0.963704824448,0.1,0.958817362785,0.7,0.952146351337,14.82,0.941240012646,19.75,0.922757863998,20.71,0.891701042652,21.12,0.837504327297,21.29,0.759547412395,21.26,0.677126049995,21.28,0.59989631176
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,300000,none,0.05,0.964396834373,0.11,0.959925532341,0.36,0.954678416252,4.25,0.947400927544,18.62,0.935489118099,20.88,0.915537834167,21.43,0.882643699646,21.77,0.828367352486,21.78,0.749496340752,21.8,0.663652002811,21.73,0.583706438541
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,0,300000,dropout+label_smoothing,0.15,0.969288527966,0.17,0.9645652771,0.23,0.959475517273,2.3,0.953028082848,16.9,0.942942321301,19.44,0.925982296467,19.79,0.89823538065,19.91,0.851508617401,19.99,0.77749890089,19.95,0.690432310104,19.94,0.606712698936
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,0,300000,label_smoothing,0.06,0.972924411297,0.08,0.969604253769,0.26,0.96572893858,3.22,0.960266709328,16.56,0.950922906399,19.72,0.93460637331,20.51,0.907115876675,20.65,0.859336316586,20.91,0.785673260689,21.02,0.704251468182,20.97,0.629137098789
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,0,300000,none,0.03,0.969621360302,0.06,0.966165482998,0.27,0.962050795555,7.02,0.956085085869,18.5,0.945814013481,20.29,0.928064584732,20.97,0.898355424404,21.22,0.849131345749,21.16,0.775459706783,21.22,0.692432820797,21.26,0.616164445877
sparse_transformer_variational_dropout,1.55555555556e-7,linear,100000,300000,dropout+label_smoothing,0.15,0.950906217098,0.21,0.944040298462,0.54,0.936015844345,8.67,0.925409555435,19.49,0.909726798534,20.41,0.885568201542,20.8,0.845314264297,20.83,0.778796851635,20.91,0.693229615688,20.88,0.598019659519,20.94,0.500476002693
sparse_transformer_variational_dropout,1.55555555556e-7,linear,100000,300000,label_smoothing,0.15,0.951626121998,0.08,0.946746349335,0.19,0.940640211105,3.44,0.931985557079,17.61,0.918241381645,20.57,0.895637392998,21.4,0.85481774807,21.72,0.78709936142,21.64,0.701734542847,21.88,0.607553064823,21.74,0.510891139507
sparse_transformer_variational_dropout,1.55555555556e-7,linear,100000,300000,none,0,0.949056386948,0.08,0.943709731102,0.27,0.936936974525,5.31,0.927238643169,18.58,0.91204303503,20.73,0.887841403484,21.55,0.847195923328,21.93,0.780443608761,21.95,0.692577123642,22.14,0.594930291176,22.28,0.496130824089
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,100000,300000,dropout+label_smoothing,0.09,0.956334114075,0.13,0.950741767883,0.26,0.944243550301,4.49,0.935518085957,18.81,0.922029674053,20.13,0.900310516357,20.54,0.863353312016,20.64,0.799509644508,20.71,0.713726818562,20.73,0.617614626884,20.7,0.518630445004
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,100000,300000,label_smoothing,0.05,0.958106637001,0.04,0.95423668623,0.08,0.949361562729,1.06,0.942145228386,16.26,0.930068731308,20.46,0.909366250038,21.13,0.871527373791,21.31,0.805080294609,21.47,0.718364834785,21.56,0.622392296791,21.66,0.523639142513
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,100000,300000,none,0.08,0.955410003662,0.14,0.95122975111,0.34,0.945941925049,4.65,0.938065588474,18.55,0.9249740839,20.9,0.903095901012,21.62,0.865506350994,21.82,0.801189243793,21.84,0.712868869305,21.99,0.613494992256,21.96,0.512812793255
sparse_transformer_variational_dropout,1.55555555556e-7,linear,200000,300000,dropout+label_smoothing,0.16,0.934155583382,0.72,0.926700890064,8.97,0.917093575001,19.25,0.90392768383,20.8,0.885278224945,21.25,0.857586920261,21.45,0.810473680496,21.61,0.740955173969,21.63,0.65462744236,21.64,0.557433962822,21.72,0.456730931997
sparse_transformer_variational_dropout,1.55555555556e-7,linear,200000,300000,label_smoothing,0.09,0.927653253078,0.27,0.92268383503,2.17,0.915711820126,15.68,0.905300438404,20.01,0.889439105988,21.33,0.863799095154,21.99,0.817063331604,22.1,0.747934579849,22.19,0.662329256535,22.23,0.565940439701,22.26,0.46532997489
sparse_transformer_variational_dropout,1.55555555556e-7,linear,200000,300000,none,0.12,0.92367041111,0.36,0.918156087399,3.49,0.910355687141,16.81,0.898907661438,20.92,0.88201791048,21.92,0.855907797813,22.3,0.811126887798,22.38,0.742193460464,22.47,0.653512120247,22.49,0.553181231022,22.58,0.450176775455
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,200000,300000,dropout+label_smoothing,0.07,0.943807780743,0.2,0.937946140766,1.15,0.930474698544,14.55,0.919950306416,19.72,0.90400159359,20.66,0.878850579262,21.01,0.834254801273,21.12,0.764702737331,21.1,0.676424920559,21.18,0.576061606407,21.15,0.471175909042
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,200000,300000,label_smoothing,0.1,0.938605964184,0.12,0.934920787811,0.49,0.929761946201,8.47,0.921655476093,18.85,0.90827280283,21.08,0.885385096073,21.46,0.84143280983,22,0.772136449814,22.26,0.683700740337,22.32,0.582308530807,22.33,0.475274950266
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,200000,300000,none,0.05,0.936176240444,0.14,0.932066440582,0.71,0.92626452446,11.88,0.917194187641,20.08,0.902522802353,21.66,0.878418505192,22.05,0.835441529751,22.24,0.765919148922,22.28,0.674335956573,22.29,0.569452226162,22.33,0.461180061102
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,300000,dropout+label_smoothing,0.19,0.943876445293,0.24,0.934820175171,1.08,0.924499869347,16.94,0.91064375639,20.87,0.88954937458,21.71,0.857379078865,21.77,0.808485150337,21.98,0.733578085899,21.99,0.639918446541,21.99,0.546985626221,22.07,0.462001413107
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,300000,label_smoothing,0.1,0.949047625065,0.23,0.942473053932,2.15,0.93439245224,16.56,0.922591805458,20.84,0.903423309326,22.02,0.872865617275,22.43,0.824373424053,22.61,0.749590337276,22.53,0.660726308823,22.62,0.575580716133,22.57,0.499057352543
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,300000,none,0.03,0.943998396397,0.1,0.937199950218,2.09,0.928711295128,17.08,0.916086018085,21.5,0.89562022686,22.58,0.863239586353,22.86,0.813366413116,22.8,0.740019142628,22.95,0.649756491184,22.89,0.561988830566,22.87,0.484100162983
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,0,300000,dropout+label_smoothing,0.13,0.951253712177,0.2,0.944042086601,0.71,0.935740292072,13.15,0.924136161804,20.54,0.905720889568,21.28,0.876749932766,21.48,0.832214236259,21.55,0.763622939587,21.5,0.673026621342,21.58,0.582143306732,21.59,0.500322520733
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,0,300000,label_smoothing,0.06,0.956844389439,0.08,0.951519668102,0.78,0.944931566715,14.55,0.935005068779,20.6,0.918082475662,21.66,0.890303552151,22.22,0.846154510975,22.31,0.777164518833,22.47,0.689961135387,22.44,0.606224119663,22.46,0.532758355141
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,0,300000,none,0.11,0.953068733215,0.22,0.947998642921,2.68,0.941407263279,17.22,0.930974245071,20.88,0.913208186626,21.9,0.884201824665,22.43,0.838954389095,22.5,0.771569132805,22.56,0.685341000557,22.68,0.600489914417,22.61,0.526815891266
sparse_transformer_variational_dropout,8.88888888889e-8,linear,100000,300000,dropout+label_smoothing,0.18,0.929144561291,0.46,0.918391883373,6.19,0.905246019363,20.16,0.887270927429,21.68,0.861345171928,21.93,0.823165953159,21.99,0.76318949461,22.11,0.67833429575,22.18,0.582372009754,22.19,0.48533821106,22.12,0.393779754639
sparse_transformer_variational_dropout,8.88888888889e-8,linear,100000,300000,label_smoothing,0,0.931397438049,0.1,0.923379838467,1.94,0.912748754025,17.07,0.89708173275,21.55,0.873219072819,22.43,0.836263656616,22.87,0.775327265263,23.02,0.690946280956,23.06,0.597019851208,23.02,0.502346515656,23.07,0.412342071533
sparse_transformer_variational_dropout,8.88888888889e-8,linear,100000,300000,none,0.04,0.92585670948,0.25,0.917111814022,6.47,0.905556857586,19.28,0.88879430294,21.77,0.863807201385,22.79,0.825829684734,22.86,0.766205251217,23.21,0.681764662266,23.2,0.585106492043,23.14,0.487825810909,23.16,0.396614789963
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,100000,300000,dropout+label_smoothing,0.13,0.936484694481,0.26,0.927573502064,1.35,0.916718780994,17.01,0.901426494122,21.11,0.878114283085,21.8,0.84243196249,22.07,0.785242795944,22.17,0.700814902782,22.25,0.603481471539,22.23,0.504836797714,22.25,0.411694407463
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,100000,300000,label_smoothing,0,0.93991202116,0.06,0.933519184589,0.41,0.925089359283,10.84,0.912261545658,20.73,0.891493916512,22.19,0.857746481895,22.57,0.800202548504,22.74,0.715636134148,22.87,0.61944848299,22.82,0.52199691534,22.73,0.429088890553
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,100000,300000,none,0.05,0.936045050621,0.25,0.929090023041,5.06,0.91973054409,18.46,0.905454456806,21.46,0.883085906506,22.52,0.847808241844,22.88,0.791189074516,22.87,0.707592308521,22.91,0.609307706356,22.98,0.509576797485,23.02,0.415833085775
sparse_transformer_variational_dropout,8.88888888889e-8,linear,200000,300000,dropout+label_smoothing,0.58,0.907935619354,8.15,0.895817279816,20.42,0.879951179028,22.24,0.858943939209,22.66,0.830575525761,22.94,0.78939896822,22.89,0.724501907825,22.86,0.639469027519,22.96,0.544013619423,23.01,0.446780532598,23.1,0.355053305626
sparse_transformer_variational_dropout,8.88888888889e-8,linear,200000,300000,label_smoothing,0.27,0.900697767735,3.86,0.891725122929,17.9,0.879110813141,21.46,0.861313581467,22.65,0.835927128792,23.11,0.796452701092,23.37,0.732062041759,23.33,0.648025333881,23.51,0.553568661213,23.48,0.457117676735,23.52,0.36524310708
sparse_transformer_variational_dropout,8.88888888889e-8,linear,200000,300000,none,0.98,0.891255438328,11.21,0.881507158279,19.41,0.868150889874,21.88,0.849774897099,22.92,0.8240416646,23.34,0.785064697266,23.53,0.722900509834,23.68,0.638797998428,23.6,0.542563319206,23.66,0.44443321228,23.65,0.352536648512
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,200000,300000,dropout+label_smoothing,0.23,0.921594083309,0.87,0.911100327969,12.79,0.89697188139,21.03,0.876662492752,21.95,0.847183763981,22.28,0.803531825542,22.44,0.735645711422,22.48,0.646702945232,22.46,0.547908604145,22.45,0.448411494493,22.52,0.355248451233
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,200000,300000,label_smoothing,0.15,0.918336391449,0.52,0.911454379559,7.04,0.901565790176,19.51,0.886503756046,21.92,0.863265037537,22.74,0.825545310974,23.16,0.761712908745,23.27,0.675879657269,23.19,0.578262805939,23.16,0.477575957775,23.2,0.380857855082
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,200000,300000,none,0.11,0.913143932819,0.83,0.905529499054,11.88,0.894625425339,20.69,0.878419399261,22.5,0.854129433632,22.85,0.816045463085,23.14,0.753968119621,23.19,0.667577922344,23.25,0.567458868027,23.41,0.464667588472,23.45,0.367637455463
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,300000,dropout+label_smoothing,2.24,0.847104668617,19.74,0.824926197529,23.57,0.794803619385,24.34,0.752880275249,24.46,0.69639724493,24.53,0.623890280724,24.56,0.535886228085,24.61,0.439041286707,24.6,0.350362062454,24.6,0.275112181902,24.58,0.213227272034
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,300000,label_smoothing,2.47,0.847924351692,17.49,0.829746127129,23.26,0.803604006767,24.35,0.765769839287,24.85,0.712737858295,25.13,0.642350912094,25.13,0.554494559765,25.16,0.459180682898,25.1,0.372985064983,25.14,0.300026297569,25.08,0.239632919431
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,300000,none,7.26,0.829968988895,20.78,0.811558187008,23.81,0.785143256187,24.75,0.746748447418,24.98,0.692362129688,25.15,0.620975732803,25.32,0.534657001495,25.28,0.44067338109,25.3,0.354252487421,25.32,0.281701892614,25.37,0.222412288189
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,0,300000,dropout+label_smoothing,0.87,0.865615606308,15.74,0.84656471014,22.87,0.819663584232,24.09,0.780516803265,24.33,0.726225912571,24.41,0.655933737755,24.45,0.570476293564,24.45,0.47408926487,24.53,0.383802980185,24.57,0.307644814253,24.64,0.245092689991
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,0,300000,label_smoothing,0.59,0.874766111374,8.47,0.860102117062,21.74,0.837570488453,24.33,0.802734196186,24.62,0.752350091934,24.8,0.684815168381,24.73,0.600449085236,24.76,0.505684912205,24.75,0.418812185526,24.75,0.345938920975,24.76,0.28584164381
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,0,300000,none,2.17,0.863528847694,16.5,0.848739266396,22.61,0.825724303722,23.97,0.789969980717,24.51,0.737921893597,24.44,0.669098258018,24.56,0.58592569828,24.56,0.49362668395,24.62,0.406474024057,24.63,0.33345913887,24.57,0.273891627789
sparse_transformer_variational_dropout,2.22222222222e-8,linear,100000,300000,dropout+label_smoothing,19.15,0.816881477833,23.8,0.790663361549,24.78,0.756863176823,25.18,0.712634086609,25.22,0.654437601566,25.23,0.579516947269,25.2,0.488451570272,25.23,0.395862221718,25.22,0.312650412321,25.16,0.241908818483,25.2,0.184104308486
sparse_transformer_variational_dropout,2.22222222222e-8,linear,100000,300000,label_smoothing,15.97,0.799038469791,22.6,0.776077985764,24.38,0.745907962322,24.99,0.70520824194,25.38,0.649724900723,25.42,0.575753629208,25.41,0.485070049763,25.4,0.394066393375,25.45,0.31236949563,25.47,0.243107452989,25.51,0.186357557774
sparse_transformer_variational_dropout,2.22222222222e-8,linear,100000,300000,none,20.4,0.762172162533,23.73,0.739774405956,24.93,0.711055219173,25.23,0.671898186207,25.51,0.617660284042,25.56,0.546222865582,25.59,0.460159748793,25.52,0.372452020645,25.47,0.293443888426,25.47,0.226586461067,25.44,0.172438800335
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,100000,300000,dropout+label_smoothing,6.66,0.837429702282,21.76,0.813626289368,23.92,0.781566262245,24.52,0.73811173439,24.74,0.679974019527,24.71,0.604712188244,24.67,0.512267529964,24.73,0.416864514351,24.64,0.330550789833,24.64,0.256878525019,24.68,0.196167588234
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,100000,300000,label_smoothing,2.51,0.833659231663,18.68,0.812946677208,23.29,0.784009337425,24.55,0.74338310957,25.09,0.687068879604,25.17,0.611874759197,25.3,0.518685996532,25.25,0.423730760813,25.36,0.338201671839,25.3,0.265195071697,25.28,0.204774990678
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,100000,300000,none,11.55,0.810985147953,20.86,0.790111660957,23.61,0.761224210262,24.56,0.72043043375,24.96,0.663669705391,24.96,0.589287936687,25.25,0.499282300472,25.17,0.406073451042,25.4,0.321577072144,25.32,0.249794512987,25.29,0.191088423133
sparse_transformer_variational_dropout,2.22222222222e-8,linear,200000,300000,dropout+label_smoothing,24.65,0.762913584709,25.3,0.739038109779,25.5,0.709504723549,25.5,0.670442163944,25.63,0.617121994495,25.58,0.545140326023,25.58,0.457688510418,25.66,0.370299726725,25.64,0.291404217482,25.62,0.224420800805,25.63,0.169834390283
sparse_transformer_variational_dropout,2.22222222222e-8,linear,200000,300000,label_smoothing,24.44,0.686501502991,25.32,0.666198968887,25.75,0.642094671726,25.79,0.609262406826,25.98,0.561556756496,26.01,0.494234740734,26.04,0.41271263361,26.05,0.332087904215,26.05,0.260545104742,26.07,0.200637727976,26.06,0.15216563642
sparse_transformer_variational_dropout,2.22222222222e-8,linear,200000,300000,none,24.29,0.613419473171,24.69,0.594093501568,24.91,0.571712374687,24.98,0.540947139263,24.93,0.496254324913,24.84,0.434938013554,24.81,0.361951053143,24.8,0.289698958397,24.72,0.225616574287,24.72,0.172387525439,24.7,0.129932150245
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,200000,300000,dropout+label_smoothing,22.12,0.806685388088,24.41,0.780927181244,24.67,0.748012959957,24.99,0.704814076424,25.19,0.647129893303,25.31,0.571214854717,25.33,0.479886591434,25.29,0.388671994209,25.28,0.306455880404,25.25,0.236443474889,25.25,0.179248139262
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,200000,300000,label_smoothing,21.04,0.777033686638,23.78,0.755036652088,24.69,0.726370692253,25.29,0.687332868576,25.36,0.632894217968,25.56,0.558601677418,25.68,0.468821376562,25.64,0.379672557116,25.64,0.299568623304,25.68,0.231702595949,25.58,0.176198467612
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,200000,300000,none,21.87,0.733025431633,23.69,0.711428761482,24.48,0.684608519077,24.79,0.647848010063,24.89,0.595833599567,24.83,0.525871038437,24.92,0.442003190517,24.93,0.357655912638,24.94,0.281600654125,25,0.21744145453,24.94,0.165604367852
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,400000,dropout+label_smoothing,0.13,0.971401929855,0.19,0.966197192669,0.29,0.960625052452,1.52,0.953983366489,14.77,0.944582223892,18.88,0.929797232151,19.58,0.905902147293,19.76,0.863921284676,19.72,0.79483127594,19.8,0.711292386055,19.84,0.625875413418
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,400000,label_smoothing,0,0.973492145538,0.12,0.969624757767,0.32,0.965315461159,1.72,0.959826529026,12.44,0.951406955719,18.89,0.937415957451,20.08,0.91352057457,20.48,0.869358599186,20.49,0.799306809902,20.61,0.719510316849,20.59,0.641273498535
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,400000,none,0,0.970427155495,0.05,0.96651661396,0.14,0.962077200413,2.33,0.95626860857,16.6,0.94718170166,19.83,0.931975364685,20.79,0.906509101391,21.01,0.862342476845,21.18,0.792496263981,21.2,0.710479795933,21.36,0.630436003208
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,0,400000,dropout+label_smoothing,0.26,0.976285398006,0.29,0.972462654114,0.33,0.968407154083,1.05,0.96351391077,12.71,0.956233799458,17.96,0.944110929966,18.86,0.923828661442,19.29,0.888395428658,19.41,0.826700329781,19.42,0.745645225048,19.43,0.662651836872
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,0,400000,label_smoothing,0.04,0.978702664375,0.04,0.975968122482,0.05,0.972891509533,0.89,0.968842327595,9.5,0.96226477623,18.07,0.950588405132,19.76,0.930358290672,20.2,0.893526077271,20.34,0.830167293549,20.38,0.752269387245,20.41,0.676084578037
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,0,400000,none,0.13,0.976102292538,0.18,0.973167657852,0.21,0.969820022583,1.56,0.965259194374,13.81,0.957679867744,19.34,0.944437086582,20.41,0.921911418438,20.78,0.882833182812,20.87,0.818622887135,20.72,0.738550305367,20.98,0.66014534235
sparse_transformer_variational_dropout,2.22222222222e-7,linear,100000,400000,dropout+label_smoothing,0.13,0.957304120064,0.16,0.951555073261,0.28,0.944928526878,3.43,0.936512947083,17.39,0.92436414957,19.45,0.905777096748,20.15,0.874546647072,20.38,0.81953638792,20.43,0.743813157082,20.47,0.654686272144,20.54,0.558143615723
sparse_transformer_variational_dropout,2.22222222222e-7,linear,100000,400000,label_smoothing,0.06,0.956868708134,0,0.952837765217,0.15,0.947916209698,1.38,0.941205084324,14.38,0.930806994438,19.5,0.913693368435,20.8,0.881986498833,21.1,0.825216472149,21.25,0.749038040638,21.32,0.660627305508,21.42,0.565034270287
sparse_transformer_variational_dropout,2.22222222222e-7,linear,100000,400000,none,0.1,0.95442289114,0.15,0.950009346008,0.79,0.94454729557,8.6,0.937034547329,18.63,0.925505936146,20.23,0.90717625618,21,0.875931918621,21.28,0.821058213711,21.42,0.743147492409,21.47,0.650921583176,21.56,0.552298247814
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,100000,400000,dropout+label_smoothing,0.06,0.964071154594,0.13,0.95966899395,0.18,0.954701125622,0.54,0.948344707489,10.97,0.938749551773,19.02,0.922974765301,19.77,0.895493805408,20.02,0.84437417984,19.99,0.768933534622,20.1,0.67862534523,20.13,0.580061912537
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,100000,400000,label_smoothing,0.05,0.964671075344,0.06,0.961727380753,0.1,0.958123087883,0.55,0.953073263168,12.51,0.944753110409,18.92,0.930160701275,20.03,0.902546465397,20.48,0.849192380905,20.78,0.772585570812,20.96,0.682115495205,21.01,0.583560585976
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,100000,400000,none,0.04,0.962852358818,0.14,0.959533631802,0.19,0.955443024635,1.07,0.949645638466,15.33,0.940163969994,19.95,0.924167156219,20.86,0.896254777908,21.18,0.845022082329,21.34,0.767333507538,21.45,0.673050284386,21.45,0.571655571461
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,400000,dropout+label_smoothing,0.14,0.9612377882,0.19,0.954443871975,0.39,0.947016656399,4.18,0.937772989273,18.9,0.924169123173,20.12,0.90299898386,20.39,0.869558215141,20.67,0.813437104225,20.68,0.731828570366,20.74,0.642411589622,20.75,0.555320739746
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,400000,label_smoothing,0.11,0.964244008064,0.2,0.959215939045,0.77,0.953450262547,8.23,0.945795893669,18.14,0.93378919363,20.36,0.91407430172,21.22,0.881129682064,21.51,0.823637783527,21.56,0.743703305721,21.68,0.66027200222,21.73,0.581537365913
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,400000,none,0.05,0.960491478443,0.13,0.955350279808,0.53,0.949356019497,7.98,0.941146075726,19.34,0.928132116795,21.11,0.906876146793,21.52,0.8722833395,21.8,0.815527737141,21.97,0.734801828861,21.9,0.64836192131,21.96,0.567724108696
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,0,400000,dropout+label_smoothing,0.18,0.967629611492,0.23,0.96250140667,0.4,0.9569414258,2.84,0.949917554855,17.31,0.939121246338,19.52,0.921385705471,19.98,0.892491161823,20.19,0.843771100044,20.18,0.767807722092,20.23,0.680154144764,20.25,0.595852375031
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,0,400000,label_smoothing,0.06,0.971246957779,0.08,0.967748939991,0.1,0.963674008846,1.48,0.957936882973,16.38,0.948230922222,19.85,0.931403338909,20.69,0.90288156271,21.03,0.853007495403,21.21,0.777887821198,21.21,0.696751236916,21.15,0.621868908405
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,0,400000,none,0,0.967989444733,0.17,0.964344024658,0.53,0.960056245327,7.99,0.953965485096,18.88,0.943590164185,20.7,0.925543010235,21.54,0.895275533199,21.43,0.844942212105,21.62,0.769726157188,21.63,0.685640513897,21.79,0.608041882515
sparse_transformer_variational_dropout,1.55555555556e-7,linear,100000,400000,dropout+label_smoothing,0.11,0.946377277374,0.25,0.938662588596,1.53,0.929588615894,16.32,0.917741179466,19.94,0.900644600391,20.92,0.875111341476,21.06,0.833122551441,21.09,0.765429377556,21.31,0.679805457592,21.37,0.585104286671,21.38,0.488194078207
sparse_transformer_variational_dropout,1.55555555556e-7,linear,100000,400000,label_smoothing,0,0.946348190308,0,0.940919339657,0.16,0.934058666229,5.43,0.924405634403,18.75,0.90948677063,21.12,0.885677874088,21.84,0.843194425106,22.16,0.774990260601,22.24,0.690559089184,22.41,0.597826302052,22.32,0.502904951572
sparse_transformer_variational_dropout,1.55555555556e-7,linear,100000,400000,none,0.08,0.942770004272,0.16,0.936763823032,2.13,0.929119467735,15.14,0.918371617794,20.48,0.902197599411,21.92,0.877233147621,22.48,0.835807085037,22.66,0.768733978271,22.58,0.681795418262,22.75,0.585657179356,22.72,0.488540112972
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,100000,400000,dropout+label_smoothing,0.09,0.954721450806,0.13,0.948693990707,0.3,0.941733539104,4.05,0.932430565357,19.01,0.918073475361,20.31,0.895211696625,20.6,0.85669362545,20.74,0.791279375553,20.86,0.704892873764,20.83,0.608673870564,20.89,0.510142922401
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,100000,400000,label_smoothing,0.11,0.956126868725,0.31,0.951967895031,0.72,0.946773588657,6.38,0.939215958118,18.16,0.926767349243,20.67,0.905694425106,21.38,0.866993069649,21.74,0.800180673599,21.88,0.714122593403,21.88,0.619048714638,21.85,0.521401643753
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,100000,400000,none,0,0.953726530075,0.04,0.94923132658,0.35,0.943560361862,5.2,0.935271322727,18.75,0.921737372875,20.88,0.89941161871,21.53,0.861121416092,21.93,0.796158671379,21.89,0.707987904549,21.86,0.6091375947,21.82,0.508929252625
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,400000,dropout+label_smoothing,0.1,0.939122676849,0.17,0.929043769836,2.13,0.917530655861,18.56,0.902159631252,21.34,0.879482448101,21.86,0.845560312271,22.01,0.794347047806,22.12,0.716540336609,22.13,0.621701955795,22.2,0.528069555759,22.13,0.442098408937
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,400000,label_smoothing,0.26,0.943617999554,0.24,0.935813128948,2.69,0.926384985447,17.25,0.912984788418,21.57,0.892057776451,22.48,0.859530329704,22.95,0.808518826962,23.05,0.731236100197,23,0.64148914814,23,0.55558526516,23.12,0.478021889925
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,400000,none,0.07,0.937831878662,0.31,0.930021345615,5.62,0.920415639877,18.65,0.906553268433,21.83,0.884974658489,22.55,0.851503551006,22.9,0.80016374588,22.97,0.724489808083,23.03,0.632411360741,23.08,0.542993724346,23.09,0.462935239077
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,0,400000,dropout+label_smoothing,0.11,0.948931694031,0.25,0.941169142723,0.81,0.932284414768,13.65,0.920069098473,20.74,0.900923669338,21.47,0.870954930782,21.68,0.824886441231,21.67,0.753973841667,21.72,0.661616802216,21.72,0.569464027882,21.74,0.486041039228
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,0,400000,label_smoothing,0.06,0.954482197762,0.11,0.949024617672,0.72,0.942287683487,12.56,0.932139754295,20.96,0.915068745613,22.06,0.88708114624,22.43,0.842426598072,22.64,0.772362709045,22.67,0.684785842896,22.56,0.600589871407,22.63,0.5261977911
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,0,400000,none,0,0.950122833252,0.12,0.944499075413,0.66,0.937380194664,14.08,0.926450848579,21.26,0.907985091209,22.09,0.877783894539,22.54,0.830752193928,22.74,0.761009812355,22.82,0.672790408134,22.83,0.586375832558,22.9,0.510920345783
sparse_transformer_variational_dropout,8.88888888889e-8,linear,100000,400000,dropout+label_smoothing,0.15,0.92181634903,0.93,0.910071909428,13.16,0.895623266697,21.07,0.876151144505,22.09,0.848885178566,22.44,0.809555590153,22.45,0.748148143291,22.49,0.662728726864,22.64,0.566685676575,22.68,0.469602376223,22.69,0.378297001123
sparse_transformer_variational_dropout,8.88888888889e-8,linear,100000,400000,label_smoothing,0.1,0.922433197498,0.38,0.913577318192,5.31,0.90198302269,19.15,0.885450959206,22.05,0.861107587814,22.68,0.823854386806,22.96,0.762397766113,23.03,0.677973389626,23.08,0.583982884884,23.07,0.488905578852,23.11,0.398699343204
sparse_transformer_variational_dropout,8.88888888889e-8,linear,100000,400000,none,0.23,0.915825843811,1.75,0.906381607056,13.28,0.893839597702,20.96,0.876094818115,22.42,0.850569844246,23.15,0.812401294708,23.41,0.752565383911,23.56,0.668679535389,23.56,0.572914958,23.6,0.476104110479,23.56,0.385128200054
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,100000,400000,dropout+label_smoothing,0.14,0.934593319893,0.24,0.92525357008,2.54,0.913899898529,19.32,0.898012518883,21.48,0.874219954014,21.79,0.838225066662,22,0.780564188957,22.23,0.696267008781,22.27,0.599454283714,22.2,0.501063108444,22.24,0.408145487309
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,100000,400000,label_smoothing,0.06,0.93709808588,0.15,0.930160880089,0.86,0.921068370342,15.09,0.907396137714,20.8,0.885717391968,22.1,0.851082503796,22.6,0.79257529974,22.88,0.708025157452,22.83,0.612457215786,22.9,0.515732049942,22.99,0.423565655947
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,100000,400000,none,0,0.932762861252,0.27,0.925383090973,5.91,0.915521323681,19,0.90070271492,22.03,0.877667546272,23,0.84168022871,23.27,0.784208238125,23.43,0.700625777245,23.42,0.603319346905,23.37,0.504826486111,23.39,0.412347406149
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,400000,dropout+label_smoothing,6.91,0.836353957653,21.49,0.812901854515,23.71,0.781609356403,24.51,0.739076435566,24.64,0.682345271111,24.74,0.609795928001,24.79,0.521647274494,24.84,0.425698161125,24.76,0.338343381882,24.77,0.264213949442,24.72,0.203538268805
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,400000,label_smoothing,7.68,0.830482542515,19.64,0.81087988615,23.65,0.78356474638,24.78,0.744957566261,25.12,0.691197991371,25.2,0.61974298954,25.22,0.530677139759,25.33,0.435302227736,25.33,0.349522024393,25.33,0.276902973652,25.42,0.217028230429
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,400000,none,7.13,0.807768940926,21.63,0.78866404295,24.34,0.762012898922,25.04,0.723614513874,25.24,0.669404149055,25.36,0.597966849804,25.34,0.51166677475,25.3,0.418363839388,25.27,0.333391994238,25.29,0.262041538954,25.26,0.203889712691
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,0,400000,dropout+label_smoothing,0.64,0.86003100872,14.69,0.840062618256,23.34,0.812187194824,24.17,0.772177875042,24.35,0.717231094837,24.42,0.646173536777,24.58,0.559721767902,24.56,0.462832421064,24.61,0.372896283865,24.67,0.296829938889,24.7,0.234325200319
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,0,400000,label_smoothing,0.88,0.866805493832,12.05,0.850988805294,22.18,0.827263832092,24.02,0.791309535503,24.66,0.739703893661,24.8,0.67063242197,24.92,0.584394454956,24.93,0.488581508398,24.97,0.40125232935,24.94,0.327854216099,24.97,0.267253160477
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,0,400000,none,2.53,0.854529857635,17.31,0.83898639679,22.89,0.815278291702,24.36,0.778975248337,24.83,0.726510345936,25.08,0.656973361969,25.09,0.572851657867,25.08,0.479801654816,25.22,0.392509758472,25.17,0.319347262383,25.17,0.259612560272
sparse_transformer_variational_dropout,2.22222222222e-8,linear,100000,400000,dropout+label_smoothing,22.42,0.795582354069,24.47,0.769875228405,25.08,0.737266659737,25.29,0.694915950298,25.33,0.638622641563,25.37,0.565288722515,25.39,0.4754306674,25.44,0.384359300137,25.42,0.302483439445,25.44,0.232987090945,25.41,0.176320537925
sparse_transformer_variational_dropout,2.22222222222e-8,linear,100000,400000,label_smoothing,21.86,0.759576618671,24.54,0.737424969673,25.3,0.709211349487,25.54,0.671297550201,25.59,0.618651092052,25.54,0.547287285328,25.63,0.459614932537,25.73,0.37196585536,25.7,0.2936373353,25.71,0.227554515004,25.68,0.173805043101
sparse_transformer_variational_dropout,2.22222222222e-8,linear,100000,400000,none,22.69,0.70847004652,24.23,0.686977922916,24.67,0.660844147205,25.09,0.625324785709,25.18,0.574999392033,25.09,0.507585942745,25.27,0.425820380449,25.27,0.343221485615,25.13,0.269169986248,25.14,0.20690575242,25.28,0.156791448593
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,100000,400000,dropout+label_smoothing,14.33,0.831612348557,23.15,0.807112693787,24.28,0.774623572826,24.6,0.731036484241,24.84,0.672921776772,24.86,0.597671806812,24.93,0.505525648594,24.96,0.410664737225,24.93,0.324985563755,24.97,0.251916229725,24.94,0.191932052374
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,100000,400000,label_smoothing,10.76,0.824002146721,20.76,0.802559018135,23.97,0.773080587387,24.86,0.732375264168,25.23,0.676274418831,25.28,0.60148614645,25.32,0.508999705315,25.25,0.415085762739,25.33,0.33059990406,25.35,0.25858721137,25.44,0.199223220348
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,100000,400000,none,15.94,0.797921419144,21.86,0.776390194893,23.81,0.747356951237,24.54,0.706984341145,24.93,0.650893568993,24.95,0.577420055866,24.91,0.488719463348,24.93,0.39740088582,24.92,0.314759582281,24.99,0.244523733854,25.02,0.187190413475
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,500000,dropout+label_smoothing,0.15,0.968239963055,0.14,0.962478637695,0.22,0.956291973591,1.7,0.948956489563,16.83,0.938750803471,19.2,0.923035383224,19.69,0.897885024548,19.91,0.853673756123,19.98,0.782606840134,20.09,0.698345482349,20.16,0.611843585968
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,500000,label_smoothing,0.05,0.970399796963,0.04,0.966129660606,0.11,0.961344897747,1.9,0.955263435841,16.01,0.946172297001,19.74,0.931354999542,20.51,0.906268060207,20.82,0.860081493855,21,0.788737177849,21.07,0.708462655544,21.12,0.629163444042
sparse_transformer_variational_dropout,2.22222222222e-7,linear,0,500000,none,0.06,0.966827511787,0.13,0.962465107441,0.15,0.957548439503,1.95,0.951220273972,16.61,0.941586911678,19.98,0.925794124603,20.99,0.899479985237,21.32,0.853823125362,21.54,0.782235920429,21.52,0.698899209499,21.44,0.617192983627
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,0,500000,dropout+label_smoothing,0.11,0.975083649158,0.19,0.970926165581,0.2,0.966526687145,1.11,0.96120685339,14.01,0.953400433064,18.75,0.940573692322,19.12,0.919412434101,19.35,0.882446289062,19.36,0.818746805191,19.47,0.73666113615,19.52,0.652597367764
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,0,500000,label_smoothing,0.08,0.977666556835,0.1,0.974803626537,0.26,0.971586167812,2.4,0.967335939407,14.69,0.960447371006,18.85,0.948374032974,19.78,0.927471876144,20.21,0.889254808426,20.32,0.824357569218,20.43,0.746124446392,20.45,0.66969203949
sparse_transformer_variational_dropout,2.22222222222e-7,cubic,0,500000,none,0.1,0.974697589874,0,0.971714317799,0.16,0.96832627058,2.4,0.963726878166,16.9,0.956091165543,19.66,0.942736566067,20.5,0.919877171516,20.53,0.879856944084,20.66,0.814212560654,20.79,0.733658671379,20.81,0.655174970627
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,500000,dropout+label_smoothing,0.12,0.95714867115,0.19,0.949612259865,0.42,0.941403508186,6.18,0.93126809597,19.48,0.916721284389,20.56,0.894567668438,20.92,0.859938681126,21.02,0.801665008068,21.03,0.718710720539,21.05,0.628268897533,21.12,0.539614021778
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,500000,label_smoothing,0.05,0.959994018078,0,0.954392492771,0.18,0.94794690609,6.52,0.93946903944,18.56,0.926500618458,20.79,0.905879795551,21.49,0.871705114841,21.78,0.812376618385,21.91,0.731342017651,21.86,0.646448731422,21.92,0.56529301405
sparse_transformer_variational_dropout,1.55555555556e-7,linear,0,500000,none,0.05,0.95554882288,0.13,0.949925839901,0.92,0.94338285923,11.89,0.934580981731,19.91,0.92091178894,21.22,0.898998439312,21.6,0.863444685936,21.85,0.805059075356,21.84,0.723646223545,21.86,0.63691753149,21.85,0.555436193943
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,0,500000,dropout+label_smoothing,0.14,0.966168403625,0.2,0.960669517517,0.37,0.954721212387,2.69,0.947271108627,18,0.935967087746,19.86,0.917577505112,20.23,0.887833356857,20.3,0.837583124638,20.39,0.760124564171,20.4,0.672163844109,20.37,0.587543308735
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,0,500000,label_smoothing,0,0.969651281834,0,0.965563178062,0.15,0.960870683193,3,0.954502642155,17.47,0.944115698338,19.98,0.926467418671,20.72,0.896809875965,20.96,0.845076441765,21.08,0.768046736717,21.08,0.685639202595,21.11,0.609170675278
sparse_transformer_variational_dropout,1.55555555556e-7,cubic,0,500000,none,0.03,0.966357767582,0.04,0.962418556213,0.14,0.957802951336,3.01,0.951313078403,18,0.940433263779,20.8,0.921712577343,21.33,0.890510618687,21.58,0.838720619678,21.61,0.762020647526,21.75,0.677073717117,21.7,0.598494172096
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,500000,dropout+label_smoothing,0.14,0.933316230774,0.31,0.922418832779,5.52,0.909893929958,19.97,0.89335334301,21.85,0.869450032711,22.29,0.834414660931,22.45,0.781902968884,22.55,0.702459931374,22.54,0.607188045979,22.56,0.512862503529,22.55,0.425848841667
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,500000,label_smoothing,0,0.936715245247,0.09,0.928484678268,2.22,0.91845446825,17.57,0.904306292534,21.62,0.882708847523,22.5,0.849675953388,22.91,0.797721326351,23.01,0.719006538391,23.05,0.628573358059,23.02,0.541239500046,23.07,0.46152856946
sparse_transformer_variational_dropout,8.88888888889e-8,linear,0,500000,none,0.14,0.929913163185,1.5,0.92146641016,11.55,0.910987377167,20.18,0.896066606045,22.52,0.873521983624,23.02,0.839215993881,23.33,0.78664201498,23.42,0.709387898445,23.51,0.616886794567,23.48,0.527132034302,23.52,0.446486353874
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,0,500000,dropout+label_smoothing,0.32,0.946294844151,0.39,0.937905192375,1.87,0.928333103657,17.43,0.915308833122,20.89,0.895253956318,21.53,0.86432236433,21.72,0.817018866539,21.82,0.744235336781,21.89,0.650980114937,21.84,0.558360934258,21.83,0.474221855402
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,0,500000,label_smoothing,0.14,0.951812684536,0.23,0.945944547653,1.01,0.938768029213,13.44,0.92808753252,20.77,0.910228073597,22.12,0.88120418787,22.53,0.834877073765,22.67,0.762620091438,22.69,0.673964858055,22.8,0.589119195938,22.75,0.513683080673
sparse_transformer_variational_dropout,8.88888888889e-8,cubic,0,500000,none,0.06,0.947515308857,0.09,0.941599309444,0.93,0.934160768986,15.8,0.922844529152,21.4,0.903911173344,22.47,0.873248279095,22.76,0.825483560562,22.89,0.754500031471,22.96,0.665271341801,22.96,0.577972710133,22.97,0.501355111599
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,500000,dropout+label_smoothing,12.76,0.822247684002,22.31,0.798597574234,23.94,0.767202615738,24.42,0.725189566612,24.65,0.669285416603,24.82,0.597373247147,24.88,0.509600400925,24.95,0.414376914501,24.97,0.327882617712,24.97,0.25462859869,24.98,0.194725498557
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,500000,label_smoothing,13.25,0.808640241623,22.09,0.788923680782,24.36,0.761846363544,25.08,0.724220812321,25.29,0.671800494194,25.37,0.601498842239,25.52,0.513295948505,25.56,0.419498980045,25.55,0.335218280554,25.59,0.263851732016,25.56,0.205308184028
sparse_transformer_variational_dropout,2.22222222222e-8,linear,0,500000,none,17.71,0.780593812466,22.99,0.762048959732,24.56,0.736713409424,25.08,0.700374603271,25.26,0.648323178291,25.36,0.578863799572,25.22,0.493999779224,25.34,0.402708977461,25.24,0.319935232401,25.32,0.250548839569,25.27,0.194359347224
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,0,500000,dropout+label_smoothing,0.61,0.855018675327,14.75,0.834376633167,22.99,0.805820584297,23.93,0.765337467194,24.25,0.7100456357,24.2,0.638701975346,24.35,0.551932036877,24.39,0.455087035894,24.41,0.365378141403,24.47,0.289497196674,24.47,0.227100014687
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,0,500000,label_smoothing,0.84,0.859415471554,15.52,0.843000590801,22.85,0.818711698055,24.24,0.782423138618,24.69,0.730693995953,24.71,0.661504745483,25.01,0.574862062931,24.9,0.47896617651,24.92,0.391649067402,24.89,0.317929655313,24.91,0.256893157959
sparse_transformer_variational_dropout,2.22222222222e-8,cubic,0,500000,none,4.47,0.844593167305,19.26,0.828102588654,23.28,0.803496301174,24.56,0.766424298286,24.86,0.713069796562,24.96,0.642396271229,25.06,0.556817412376,25.11,0.462699472904,25.05,0.375076711178,25.04,0.301642179489,25.09,0.241609930992
